crawlo 1.4.7__py3-none-any.whl → 1.4.8__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of crawlo might be problematic. Click here for more details.
- crawlo/__init__.py +90 -90
- crawlo/__version__.py +1 -1
- crawlo/cli.py +75 -75
- crawlo/commands/__init__.py +14 -14
- crawlo/commands/check.py +594 -594
- crawlo/commands/genspider.py +186 -186
- crawlo/commands/help.py +140 -140
- crawlo/commands/list.py +155 -155
- crawlo/commands/run.py +379 -379
- crawlo/commands/startproject.py +460 -460
- crawlo/commands/stats.py +187 -187
- crawlo/commands/utils.py +196 -196
- crawlo/config.py +320 -320
- crawlo/config_validator.py +277 -277
- crawlo/core/__init__.py +52 -52
- crawlo/core/engine.py +451 -451
- crawlo/core/processor.py +47 -47
- crawlo/core/scheduler.py +290 -290
- crawlo/crawler.py +698 -698
- crawlo/data/__init__.py +5 -5
- crawlo/data/user_agents.py +194 -194
- crawlo/downloader/__init__.py +280 -280
- crawlo/downloader/aiohttp_downloader.py +233 -233
- crawlo/downloader/cffi_downloader.py +250 -250
- crawlo/downloader/httpx_downloader.py +265 -265
- crawlo/downloader/hybrid_downloader.py +212 -212
- crawlo/downloader/playwright_downloader.py +425 -425
- crawlo/downloader/selenium_downloader.py +486 -486
- crawlo/event.py +45 -45
- crawlo/exceptions.py +214 -214
- crawlo/extension/__init__.py +64 -64
- crawlo/extension/health_check.py +141 -141
- crawlo/extension/log_interval.py +94 -94
- crawlo/extension/log_stats.py +70 -70
- crawlo/extension/logging_extension.py +53 -53
- crawlo/extension/memory_monitor.py +104 -104
- crawlo/extension/performance_profiler.py +133 -133
- crawlo/extension/request_recorder.py +107 -107
- crawlo/factories/__init__.py +27 -27
- crawlo/factories/base.py +68 -68
- crawlo/factories/crawler.py +104 -104
- crawlo/factories/registry.py +84 -84
- crawlo/factories/utils.py +134 -134
- crawlo/filters/__init__.py +170 -170
- crawlo/filters/aioredis_filter.py +347 -347
- crawlo/filters/memory_filter.py +261 -261
- crawlo/framework.py +306 -306
- crawlo/initialization/__init__.py +44 -44
- crawlo/initialization/built_in.py +391 -391
- crawlo/initialization/context.py +141 -141
- crawlo/initialization/core.py +240 -240
- crawlo/initialization/phases.py +229 -229
- crawlo/initialization/registry.py +143 -143
- crawlo/initialization/utils.py +48 -48
- crawlo/interfaces.py +23 -23
- crawlo/items/__init__.py +23 -23
- crawlo/items/base.py +23 -23
- crawlo/items/fields.py +52 -52
- crawlo/items/items.py +104 -104
- crawlo/logging/__init__.py +42 -42
- crawlo/logging/config.py +280 -276
- crawlo/logging/factory.py +175 -175
- crawlo/logging/manager.py +104 -104
- crawlo/middleware/__init__.py +87 -87
- crawlo/middleware/default_header.py +132 -132
- crawlo/middleware/download_delay.py +104 -104
- crawlo/middleware/middleware_manager.py +142 -142
- crawlo/middleware/offsite.py +123 -123
- crawlo/middleware/proxy.py +209 -209
- crawlo/middleware/request_ignore.py +86 -86
- crawlo/middleware/response_code.py +150 -150
- crawlo/middleware/response_filter.py +136 -136
- crawlo/middleware/retry.py +124 -124
- crawlo/mode_manager.py +287 -287
- crawlo/network/__init__.py +21 -21
- crawlo/network/request.py +408 -376
- crawlo/network/response.py +598 -569
- crawlo/pipelines/__init__.py +52 -52
- crawlo/pipelines/base_pipeline.py +452 -452
- crawlo/pipelines/bloom_dedup_pipeline.py +145 -146
- crawlo/pipelines/console_pipeline.py +39 -39
- crawlo/pipelines/csv_pipeline.py +316 -316
- crawlo/pipelines/database_dedup_pipeline.py +196 -197
- crawlo/pipelines/json_pipeline.py +218 -218
- crawlo/pipelines/memory_dedup_pipeline.py +104 -105
- crawlo/pipelines/mongo_pipeline.py +140 -139
- crawlo/pipelines/mysql_pipeline.py +468 -469
- crawlo/pipelines/pipeline_manager.py +100 -100
- crawlo/pipelines/redis_dedup_pipeline.py +155 -155
- crawlo/project.py +347 -347
- crawlo/queue/__init__.py +9 -9
- crawlo/queue/pqueue.py +38 -38
- crawlo/queue/queue_manager.py +591 -591
- crawlo/queue/redis_priority_queue.py +518 -518
- crawlo/settings/__init__.py +7 -7
- crawlo/settings/default_settings.py +287 -284
- crawlo/settings/setting_manager.py +219 -219
- crawlo/spider/__init__.py +658 -657
- crawlo/stats_collector.py +81 -81
- crawlo/subscriber.py +129 -129
- crawlo/task_manager.py +138 -138
- crawlo/templates/crawlo.cfg.tmpl +10 -10
- crawlo/templates/project/__init__.py.tmpl +1 -1
- crawlo/templates/project/items.py.tmpl +13 -13
- crawlo/templates/project/middlewares.py.tmpl +38 -38
- crawlo/templates/project/pipelines.py.tmpl +35 -35
- crawlo/templates/project/settings.py.tmpl +113 -109
- crawlo/templates/project/settings_distributed.py.tmpl +160 -156
- crawlo/templates/project/settings_gentle.py.tmpl +174 -170
- crawlo/templates/project/settings_high_performance.py.tmpl +175 -171
- crawlo/templates/project/settings_minimal.py.tmpl +102 -98
- crawlo/templates/project/settings_simple.py.tmpl +172 -168
- crawlo/templates/project/spiders/__init__.py.tmpl +9 -9
- crawlo/templates/run.py.tmpl +23 -23
- crawlo/templates/spider/spider.py.tmpl +32 -32
- crawlo/templates/spiders_init.py.tmpl +4 -4
- crawlo/tools/__init__.py +86 -86
- crawlo/tools/date_tools.py +289 -289
- crawlo/tools/distributed_coordinator.py +384 -384
- crawlo/tools/scenario_adapter.py +262 -262
- crawlo/tools/text_cleaner.py +232 -232
- crawlo/utils/__init__.py +74 -50
- crawlo/utils/batch_processor.py +276 -276
- crawlo/utils/config_manager.py +442 -442
- crawlo/utils/controlled_spider_mixin.py +439 -439
- crawlo/utils/db_helper.py +250 -250
- crawlo/utils/encoding_helper.py +190 -0
- crawlo/utils/error_handler.py +410 -410
- crawlo/utils/fingerprint.py +121 -121
- crawlo/utils/func_tools.py +82 -82
- crawlo/utils/large_scale_helper.py +344 -344
- crawlo/utils/leak_detector.py +335 -335
- crawlo/utils/misc.py +81 -81
- crawlo/utils/mongo_connection_pool.py +157 -157
- crawlo/utils/mysql_connection_pool.py +197 -197
- crawlo/utils/performance_monitor.py +285 -285
- crawlo/utils/queue_helper.py +175 -175
- crawlo/utils/redis_checker.py +90 -90
- crawlo/utils/redis_connection_pool.py +578 -578
- crawlo/utils/redis_key_validator.py +198 -198
- crawlo/utils/request.py +278 -278
- crawlo/utils/request_serializer.py +225 -225
- crawlo/utils/resource_manager.py +337 -337
- crawlo/utils/response_helper.py +113 -0
- crawlo/utils/selector_helper.py +138 -137
- crawlo/utils/singleton.py +69 -69
- crawlo/utils/spider_loader.py +201 -201
- crawlo/utils/text_helper.py +94 -94
- {crawlo-1.4.7.dist-info → crawlo-1.4.8.dist-info}/METADATA +831 -689
- crawlo-1.4.8.dist-info/RECORD +347 -0
- examples/__init__.py +7 -7
- tests/__init__.py +7 -7
- tests/advanced_tools_example.py +217 -217
- tests/authenticated_proxy_example.py +110 -110
- tests/baidu_performance_test.py +108 -108
- tests/baidu_test.py +59 -59
- tests/bug_check_test.py +250 -250
- tests/cleaners_example.py +160 -160
- tests/comprehensive_framework_test.py +212 -212
- tests/comprehensive_test.py +81 -81
- tests/comprehensive_testing_summary.md +186 -186
- tests/config_validation_demo.py +142 -142
- tests/controlled_spider_example.py +205 -205
- tests/date_tools_example.py +180 -180
- tests/debug_configure.py +69 -69
- tests/debug_framework_logger.py +84 -84
- tests/debug_log_config.py +126 -126
- tests/debug_log_levels.py +63 -63
- tests/debug_pipelines.py +66 -66
- tests/detailed_log_test.py +233 -233
- tests/direct_selector_helper_test.py +96 -96
- tests/distributed_dedup_test.py +467 -467
- tests/distributed_test.py +66 -66
- tests/distributed_test_debug.py +76 -76
- tests/dynamic_loading_example.py +523 -523
- tests/dynamic_loading_test.py +104 -104
- tests/error_handling_example.py +171 -171
- tests/explain_mysql_update_behavior.py +76 -76
- tests/final_comprehensive_test.py +151 -151
- tests/final_log_test.py +260 -260
- tests/final_validation_test.py +182 -182
- tests/fix_log_test.py +142 -142
- tests/framework_performance_test.py +202 -202
- tests/log_buffering_test.py +111 -111
- tests/log_generation_timing_test.py +153 -153
- tests/monitor_redis_dedup.sh +72 -72
- tests/ofweek_scrapy/ofweek_scrapy/items.py +12 -12
- tests/ofweek_scrapy/ofweek_scrapy/middlewares.py +100 -100
- tests/ofweek_scrapy/ofweek_scrapy/pipelines.py +13 -13
- tests/ofweek_scrapy/ofweek_scrapy/settings.py +84 -84
- tests/ofweek_scrapy/ofweek_scrapy/spiders/__init__.py +4 -4
- tests/ofweek_scrapy/scrapy.cfg +11 -11
- tests/optimized_performance_test.py +211 -211
- tests/performance_comparison.py +244 -244
- tests/queue_blocking_test.py +113 -113
- tests/queue_test.py +89 -89
- tests/redis_key_validation_demo.py +130 -130
- tests/request_params_example.py +150 -150
- tests/response_improvements_example.py +144 -144
- tests/scrapy_comparison/ofweek_scrapy.py +138 -138
- tests/scrapy_comparison/scrapy_test.py +133 -133
- tests/simple_cli_test.py +54 -54
- tests/simple_command_test.py +119 -119
- tests/simple_crawlo_test.py +126 -126
- tests/simple_follow_test.py +38 -38
- tests/simple_log_test2.py +137 -137
- tests/simple_optimization_test.py +128 -128
- tests/simple_queue_type_test.py +41 -41
- tests/simple_response_selector_test.py +94 -94
- tests/simple_selector_helper_test.py +154 -154
- tests/simple_selector_test.py +207 -207
- tests/simple_spider_test.py +49 -49
- tests/simple_url_test.py +73 -73
- tests/simulate_mysql_update_test.py +139 -139
- tests/spider_log_timing_test.py +177 -177
- tests/test_advanced_tools.py +148 -148
- tests/test_all_commands.py +230 -230
- tests/test_all_pipeline_fingerprints.py +133 -133
- tests/test_all_redis_key_configs.py +145 -145
- tests/test_asyncmy_usage.py +56 -56
- tests/test_batch_processor.py +178 -178
- tests/test_cleaners.py +54 -54
- tests/test_cli_arguments.py +118 -118
- tests/test_component_factory.py +174 -174
- tests/test_config_consistency.py +80 -80
- tests/test_config_merge.py +152 -152
- tests/test_config_validator.py +182 -182
- tests/test_controlled_spider_mixin.py +79 -79
- tests/test_crawler_process_import.py +38 -38
- tests/test_crawler_process_spider_modules.py +47 -47
- tests/test_crawlo_proxy_integration.py +114 -114
- tests/test_date_tools.py +123 -123
- tests/test_dedup_fix.py +220 -220
- tests/test_dedup_pipeline_consistency.py +124 -124
- tests/test_default_header_middleware.py +313 -313
- tests/test_distributed.py +65 -65
- tests/test_double_crawlo_fix.py +204 -204
- tests/test_double_crawlo_fix_simple.py +124 -124
- tests/test_download_delay_middleware.py +221 -221
- tests/test_downloader_proxy_compatibility.py +272 -272
- tests/test_edge_cases.py +305 -305
- tests/test_encoding_core.py +56 -56
- tests/test_encoding_detection.py +126 -126
- tests/test_enhanced_error_handler.py +270 -270
- tests/test_enhanced_error_handler_comprehensive.py +245 -245
- tests/test_error_handler_compatibility.py +112 -112
- tests/test_factories.py +252 -252
- tests/test_factory_compatibility.py +196 -196
- tests/test_final_validation.py +153 -153
- tests/test_fingerprint_consistency.py +135 -135
- tests/test_fingerprint_simple.py +51 -51
- tests/test_get_component_logger.py +83 -83
- tests/test_hash_performance.py +99 -99
- tests/test_integration.py +169 -169
- tests/test_item_dedup_redis_key.py +122 -122
- tests/test_large_scale_helper.py +235 -235
- tests/test_logging_enhancements.py +374 -374
- tests/test_logging_final.py +184 -184
- tests/test_logging_integration.py +312 -312
- tests/test_logging_system.py +282 -282
- tests/test_middleware_debug.py +141 -141
- tests/test_mode_consistency.py +51 -51
- tests/test_multi_directory.py +67 -67
- tests/test_multiple_spider_modules.py +80 -80
- tests/test_mysql_pipeline_config.py +164 -164
- tests/test_mysql_pipeline_error.py +98 -98
- tests/test_mysql_pipeline_init_log.py +82 -82
- tests/test_mysql_pipeline_integration.py +132 -132
- tests/test_mysql_pipeline_refactor.py +143 -143
- tests/test_mysql_pipeline_refactor_simple.py +85 -85
- tests/test_mysql_pipeline_robustness.py +195 -195
- tests/test_mysql_pipeline_types.py +88 -88
- tests/test_mysql_update_columns.py +93 -93
- tests/test_offsite_middleware.py +244 -244
- tests/test_offsite_middleware_simple.py +203 -203
- tests/test_optimized_selector_naming.py +100 -100
- tests/test_parsel.py +29 -29
- tests/test_performance.py +327 -327
- tests/test_performance_monitor.py +115 -115
- tests/test_pipeline_fingerprint_consistency.py +86 -86
- tests/test_priority_behavior.py +211 -211
- tests/test_priority_consistency.py +151 -151
- tests/test_priority_consistency_fixed.py +249 -249
- tests/test_proxy_health_check.py +32 -32
- tests/test_proxy_middleware.py +217 -217
- tests/test_proxy_middleware_enhanced.py +212 -212
- tests/test_proxy_middleware_integration.py +142 -142
- tests/test_proxy_middleware_refactored.py +207 -207
- tests/test_proxy_only.py +83 -83
- tests/test_proxy_providers.py +56 -56
- tests/test_proxy_stats.py +19 -19
- tests/test_proxy_strategies.py +59 -59
- tests/test_proxy_with_downloader.py +152 -152
- tests/test_queue_empty_check.py +41 -41
- tests/test_queue_manager_double_crawlo.py +173 -173
- tests/test_queue_manager_redis_key.py +179 -179
- tests/test_queue_naming.py +154 -154
- tests/test_queue_type.py +106 -106
- tests/test_queue_type_redis_config_consistency.py +130 -130
- tests/test_random_headers_default.py +322 -322
- tests/test_random_headers_necessity.py +308 -308
- tests/test_random_user_agent.py +72 -72
- tests/test_redis_config.py +28 -28
- tests/test_redis_connection_pool.py +294 -294
- tests/test_redis_key_naming.py +181 -181
- tests/test_redis_key_validator.py +123 -123
- tests/test_redis_queue.py +224 -224
- tests/test_redis_queue_name_fix.py +175 -175
- tests/test_redis_queue_type_fallback.py +129 -129
- tests/test_request_ignore_middleware.py +182 -182
- tests/test_request_params.py +111 -111
- tests/test_request_serialization.py +70 -70
- tests/test_response_code_middleware.py +349 -349
- tests/test_response_filter_middleware.py +427 -427
- tests/test_response_follow.py +104 -104
- tests/test_response_improvements.py +152 -152
- tests/test_response_selector_methods.py +92 -92
- tests/test_response_url_methods.py +70 -70
- tests/test_response_urljoin.py +86 -86
- tests/test_retry_middleware.py +333 -333
- tests/test_retry_middleware_realistic.py +273 -273
- tests/test_scheduler.py +252 -252
- tests/test_scheduler_config_update.py +133 -133
- tests/test_scrapy_style_encoding.py +112 -112
- tests/test_selector_helper.py +100 -100
- tests/test_selector_optimizations.py +146 -146
- tests/test_simple_response.py +61 -61
- tests/test_spider_loader.py +49 -49
- tests/test_spider_loader_comprehensive.py +69 -69
- tests/test_spider_modules.py +84 -84
- tests/test_spiders/test_spider.py +9 -9
- tests/test_telecom_spider_redis_key.py +205 -205
- tests/test_template_content.py +87 -87
- tests/test_template_redis_key.py +134 -134
- tests/test_tools.py +159 -159
- tests/test_user_agent_randomness.py +176 -176
- tests/test_user_agents.py +96 -96
- tests/untested_features_report.md +138 -138
- tests/verify_debug.py +51 -51
- tests/verify_distributed.py +117 -117
- tests/verify_log_fix.py +111 -111
- tests/verify_mysql_warnings.py +109 -109
- crawlo/utils/log.py +0 -80
- crawlo/utils/url_utils.py +0 -40
- crawlo-1.4.7.dist-info/RECORD +0 -347
- {crawlo-1.4.7.dist-info → crawlo-1.4.8.dist-info}/WHEEL +0 -0
- {crawlo-1.4.7.dist-info → crawlo-1.4.8.dist-info}/entry_points.txt +0 -0
- {crawlo-1.4.7.dist-info → crawlo-1.4.8.dist-info}/top_level.txt +0 -0
|
@@ -0,0 +1,347 @@
|
|
|
1
|
+
crawlo/__init__.py,sha256=weXNnBkBDN3htDD9LyVo2pJWYW8cPDhC2MwzYIA-Y9Y,2205
|
|
2
|
+
crawlo/__version__.py,sha256=_9NYs3PyBz_2XOfnTsADFo2yWVgtsIhY2vyJebGs93E,23
|
|
3
|
+
crawlo/cli.py,sha256=zbhj9RJ06C18Lc6sQjehgM3ViCBRiWh3CxtYbJeOtQc,2428
|
|
4
|
+
crawlo/config.py,sha256=VRAgw00OnSFLtowD41DOm9faXxuQuymzKWDM3eeQnkY,10052
|
|
5
|
+
crawlo/config_validator.py,sha256=YLE5JUZ-hQrWhX8_4Iq8zf7BaYl-rhG7aO-edstVFpE,11514
|
|
6
|
+
crawlo/crawler.py,sha256=13eKFmXBZfJbxkOc1cKhfdENqiFDg86Aw6E0fpjzLYA,29331
|
|
7
|
+
crawlo/event.py,sha256=P3NtfWkgidoxEmJ4xo5uG_vhAUarnrGbi9GjkdH1pSc,1297
|
|
8
|
+
crawlo/exceptions.py,sha256=B1LQsvXyOBl3GkXaUc_jMkcqB4Z_E3DNdBE4z2n3PrM,5281
|
|
9
|
+
crawlo/framework.py,sha256=yJDOdEfK7Rldga6R1jWje1P2tfHhv_-PaGeokpQ35Wk,10037
|
|
10
|
+
crawlo/interfaces.py,sha256=q1vwMSiZLfLpPhFa9Y0hAcjYEKvLkW2fZ2fmoAZ-5TE,653
|
|
11
|
+
crawlo/mode_manager.py,sha256=bbv4sdpLXoIjdIuHrJlys-AGHVND1Fr7sJaoV6kQdyc,10026
|
|
12
|
+
crawlo/project.py,sha256=nNnhwIjYxx6R7M25Wr7QDloynYJHJS2cyUrd98Rr_gc,13996
|
|
13
|
+
crawlo/stats_collector.py,sha256=8BlR5SKMTuTpCO_mtTxSYfZ80bCEe8SUJrWbS7UyphE,2793
|
|
14
|
+
crawlo/subscriber.py,sha256=h8fx69NJZeWem0ZkCmfHAi2kgfDGFObHpwN0aGNUM6Y,5115
|
|
15
|
+
crawlo/task_manager.py,sha256=KuExi62Z_ns5qQk-TCVfMlVBcK6mBC4-RYxGlcOKxm4,5964
|
|
16
|
+
crawlo/commands/__init__.py,sha256=orvY6wLOBwGUEJKeF3h_T1fxj8AaQLjngBDd-3xKOE4,392
|
|
17
|
+
crawlo/commands/check.py,sha256=Qz7c5k7BeBgD9GmA6rgIS1VP5eq-gCyDKFsSpqPZyx0,23197
|
|
18
|
+
crawlo/commands/genspider.py,sha256=JB4ZuFpKsYwtjx3DSsxugH7e3kqxhDWPG5ZKfvM0isI,6041
|
|
19
|
+
crawlo/commands/help.py,sha256=VzYmVpsTUZIFxJXu0iS0oVDCLmjdlNzVtYkqg4kIOzA,5322
|
|
20
|
+
crawlo/commands/list.py,sha256=MaiaJcrasvzDX-sawzCRk4j1VMJR4IgBT66aczpXGZ0,5875
|
|
21
|
+
crawlo/commands/run.py,sha256=VHtgSMtjvD6srw1un07iu54owWYbJWhG_yfZf_bv0QA,14722
|
|
22
|
+
crawlo/commands/startproject.py,sha256=boZrMyn6TgCi1jt3D3DQfui6hJitjwNO8mqlWKNOBns,17366
|
|
23
|
+
crawlo/commands/stats.py,sha256=TC_uVi9IYKuvBcGJtduUJPzaWGFN9ZWrNv_YUqg6b6s,6199
|
|
24
|
+
crawlo/commands/utils.py,sha256=YVNEEzlm_qNY3SVvU8h6o2lQMkVgypvoB4ZFrP4gln0,5578
|
|
25
|
+
crawlo/core/__init__.py,sha256=BWkj3AqZwp2Bk73UzUlC_qsqv_MH_HNrzy4DY1hosj4,1330
|
|
26
|
+
crawlo/core/engine.py,sha256=qKUYlEB9BhdUngKX85IVQMGPcSDVRnuldLSdmJERSWM,20090
|
|
27
|
+
crawlo/core/processor.py,sha256=GpmhrtB-plp3XwckdrcibdkTn0REE9uhOl5aPcQzLtY,1555
|
|
28
|
+
crawlo/core/scheduler.py,sha256=ldkF1KwGo4LsSldGa-clS8n1UZQBItrn757ZChGyb20,13980
|
|
29
|
+
crawlo/data/__init__.py,sha256=UPqgioMdu3imSUmpLWzVlpvoBnEfaPSAT-crCcWd7iw,121
|
|
30
|
+
crawlo/data/user_agents.py,sha256=zjjFkldQkqtrn45j0WZplaZLannPxZDeAU0JofxQcBc,9891
|
|
31
|
+
crawlo/downloader/__init__.py,sha256=wa5AY9XlWFTkZi2VBZ0hThwuPJZYdYjjHMU7nPvfmFw,9078
|
|
32
|
+
crawlo/downloader/aiohttp_downloader.py,sha256=aqmkFGcp0yFo9JdxB1UKWMVNDHGpvdRUZrM_IXZb8H4,9069
|
|
33
|
+
crawlo/downloader/cffi_downloader.py,sha256=410FOS3T6PXS4Vv6SH6I8tsOs4hVXsXny_oR4OP6M7s,10649
|
|
34
|
+
crawlo/downloader/httpx_downloader.py,sha256=BWqq-h63LYgnEWa7v0-Lwzof-lA9kREHWVkZRs7-PbY,12458
|
|
35
|
+
crawlo/downloader/hybrid_downloader.py,sha256=tXL7ceRWFrkh-YmUqVXBStjRqq0UsBjy-5NAltKOfvY,8203
|
|
36
|
+
crawlo/downloader/playwright_downloader.py,sha256=N1k7ZiRKnwhGSZnKbQ3M4SJzXJ5H-JG-nInpHHDhs3o,17622
|
|
37
|
+
crawlo/downloader/selenium_downloader.py,sha256=t5HU5utEmvLItn_Oou8a_ZGpzVZ-m_5QN7VJqh-TSdE,22151
|
|
38
|
+
crawlo/extension/__init__.py,sha256=viNq8fFDmSbvhmJUJX3-kUSikRKgFNDW8q-g8p2nsrg,2951
|
|
39
|
+
crawlo/extension/health_check.py,sha256=GL1JOuvnAPrdmmIY7uQ_YVdt0dIsYPtbof9OY75GLF8,5618
|
|
40
|
+
crawlo/extension/log_interval.py,sha256=eM6nN6-BQcGMtIAae9QSPJVK20ErzGtgriOZeVzq_j0,4462
|
|
41
|
+
crawlo/extension/log_stats.py,sha256=-CaNnBI4Ldaltjun6RyegSCIKuegfKO5xuA9nhsiXBo,2415
|
|
42
|
+
crawlo/extension/logging_extension.py,sha256=KALP8JxidozzYxD39bdkUL35HRTFdFqKYXatVKroNbU,2143
|
|
43
|
+
crawlo/extension/memory_monitor.py,sha256=dKSP6EkDnbGrv_ZSDjrHdNHMp9spDqJ9ZvvWC9dC-pk,4367
|
|
44
|
+
crawlo/extension/performance_profiler.py,sha256=SLzG9TioFO-SLyzd1-qNpsYWjc9sS4ybmza9jWzwdHg,5005
|
|
45
|
+
crawlo/extension/request_recorder.py,sha256=qRAaC9H67zr8Rp57cWqdtc21Re2XsCi49yhGWJk8uXU,4178
|
|
46
|
+
crawlo/factories/__init__.py,sha256=24dH70p05pZerO9-9gaKpTawRGeGvQYw7j5brvq8GUg,714
|
|
47
|
+
crawlo/factories/base.py,sha256=a8S5dhT7Pk2ybs34VAMmskIoa4svTcNy5KzF25tIELQ,1822
|
|
48
|
+
crawlo/factories/crawler.py,sha256=6fYbv-9UGLVmbnra-ZcXpDKYy7zKf9KhYw4GtPfxHp4,3170
|
|
49
|
+
crawlo/factories/registry.py,sha256=YU87CdsntOz609M0aQbGcCG9glPinUJxOn-_CaM4f-M,2595
|
|
50
|
+
crawlo/factories/utils.py,sha256=TIUCUjUTjh2lx5tmLdlKp1ai0C8YhF10--hY59YP-GY,4056
|
|
51
|
+
crawlo/filters/__init__.py,sha256=dKoMIZXl2W1qOsTGPW_RXB2o4DvHBFLDjkZnMxVdU5g,4982
|
|
52
|
+
crawlo/filters/aioredis_filter.py,sha256=BOiPalIMJRu_q85A6rfZKjq07m0Hi3KkDOZEIYffhBU,13752
|
|
53
|
+
crawlo/filters/memory_filter.py,sha256=CJX7P2QXy-k7wBycFfYL3_MUqqCWzIYIPpOqHUgrr6g,9227
|
|
54
|
+
crawlo/initialization/__init__.py,sha256=uNRMm9GccMYZi51scpvo-CPx_3ayp3Y81psBHlUoDfw,1132
|
|
55
|
+
crawlo/initialization/built_in.py,sha256=zODKOy6HQ1m3leG8MJg0WBKAmq-NTezL9FKY4mvSh6I,14833
|
|
56
|
+
crawlo/initialization/context.py,sha256=wG9t-M-Qttj7TN6gDumPX5Q5GHaPDUpLTZZDne2r3TE,4863
|
|
57
|
+
crawlo/initialization/core.py,sha256=sjjnzlivnuBkxVtOnEQL5YyaawYKXVDgUXyaj7dlfj4,8648
|
|
58
|
+
crawlo/initialization/phases.py,sha256=cqHBiN56a93OWrx1zRi_AsHiVoULG8-Xf9REA1Tr1NM,7171
|
|
59
|
+
crawlo/initialization/registry.py,sha256=u2AIjmsiyH13vD46RFFX5t86tOiDb1dQATOKa8JX5fI,4913
|
|
60
|
+
crawlo/initialization/utils.py,sha256=xuLIy9AUTgV23DB5UpDcRAtIMLRPWcdEUGYd0Exuf7k,1192
|
|
61
|
+
crawlo/items/__init__.py,sha256=rFpx1qFBo0Ik7bSdnXC8EVTJUOQdoJYGVdhYjaH00nk,409
|
|
62
|
+
crawlo/items/base.py,sha256=q0YTJlqUtizsqXwfWlk0ndcINV9dDyUckwMx8_JrkeY,602
|
|
63
|
+
crawlo/items/fields.py,sha256=l-DIwK6CCpdzNvf6ELz7Ckc7YCghZD9UCXA8vhNn2UE,1852
|
|
64
|
+
crawlo/items/items.py,sha256=OmVEvMmgofMU95GkaiWkfNQ2fjsH2fY9sw3SKcmUhLs,3478
|
|
65
|
+
crawlo/logging/__init__.py,sha256=D9qhyaHHxf6a8syEeqSu8uiV1fjiu0wH6mrZb544N8s,932
|
|
66
|
+
crawlo/logging/config.py,sha256=Ozouc320Y9_lFoDNqf1huL4_hN07LxEJwx4r5_l9-9g,11299
|
|
67
|
+
crawlo/logging/factory.py,sha256=3WtZcdmoypbPVpWlNHCBb45Fd-WR6y_U9y4SLR_CWKI,7019
|
|
68
|
+
crawlo/logging/manager.py,sha256=fF24ZiEPqCafpFF4e8wtZPg7SE93IcmMnVGcezbqWNM,2721
|
|
69
|
+
crawlo/middleware/__init__.py,sha256=YdPoIaPTom2r7kbTYsaNq841Idn1Fi54bs0MrkI8N-c,2269
|
|
70
|
+
crawlo/middleware/default_header.py,sha256=MAFK29Z5AVDtP5McaxTeU45BYaFm0Cxs9fRyF0J0pKg,5151
|
|
71
|
+
crawlo/middleware/download_delay.py,sha256=OVJ0Mii8bvJgbv-faeHfKp_fs2lob2vvoKw7aAfnYUA,3529
|
|
72
|
+
crawlo/middleware/middleware_manager.py,sha256=bhVkfqE1q-VGuGax3pBgjQmsPfzNLz8-pnXF6Y7fDd4,6626
|
|
73
|
+
crawlo/middleware/offsite.py,sha256=ZfiYasOhKha_uPh72E_N4uL2NEvL4zO2RDJx7jJoSQU,4669
|
|
74
|
+
crawlo/middleware/proxy.py,sha256=gNeafGnYr21is4Lth5OrNLyH3aXxs9shBWMLZkM7APs,9578
|
|
75
|
+
crawlo/middleware/request_ignore.py,sha256=I2HwUQjRG95o7qksf0CfdhaWfypu7y9IhRo3dHKa0dM,2661
|
|
76
|
+
crawlo/middleware/response_code.py,sha256=mi20tfnaBCff4fmNJ4n8txgddNyK14hoYHYVWg0-y7Y,4520
|
|
77
|
+
crawlo/middleware/response_filter.py,sha256=pLoKadA4bANC1Hdw_QJkvsiF2jhepIlUAapVKhk7NDQ,4371
|
|
78
|
+
crawlo/middleware/retry.py,sha256=_xfqzirLsgFdxIIJrfjtxuW3mCnT6Ww1EF_VSh9jzAY,4246
|
|
79
|
+
crawlo/network/__init__.py,sha256=bvEnpEUBZJ79URfNZbsHhsBKna54hM2-x_BV8eotTA4,418
|
|
80
|
+
crawlo/network/request.py,sha256=VygsnSHZFdE1XqLdmF-An0_Eq2fC53mXNeCljuKpq7g,15344
|
|
81
|
+
crawlo/network/response.py,sha256=ckWUEYEkXlbWxoOslZSB1Rl4L9TFFouA7qkBaMAEj1c,21450
|
|
82
|
+
crawlo/pipelines/__init__.py,sha256=YJ5XQUJPZWR2yiNb4O7pTNfgrWnmNgZZlcgQ4wo9IOg,1476
|
|
83
|
+
crawlo/pipelines/base_pipeline.py,sha256=8bK9kV9-zfT-NaEi7vWDmMdryYeEWHjpypHs3RYQIi0,14839
|
|
84
|
+
crawlo/pipelines/bloom_dedup_pipeline.py,sha256=o36WsfaGrGu5pJL1ULFy3Ykb-YnBgWRvVyU7cM-inU0,5429
|
|
85
|
+
crawlo/pipelines/console_pipeline.py,sha256=1-rUglds9HRhPUHiWtP927-ryIOMPmgMWgEjzIpuBaY,1274
|
|
86
|
+
crawlo/pipelines/csv_pipeline.py,sha256=MP31vod41PU5DzPWVUl2uCp2GSH7W1NW0MES0U2iFOI,12392
|
|
87
|
+
crawlo/pipelines/database_dedup_pipeline.py,sha256=QHmb0vQC0ZkIEw6cq2F3mSxvRhkvDaP1BtNzGxP39oI,7260
|
|
88
|
+
crawlo/pipelines/json_pipeline.py,sha256=nW4BI6N7OCixcicdbbQquSgLUF3Z4dP3ktBRsLFRmOw,8487
|
|
89
|
+
crawlo/pipelines/memory_dedup_pipeline.py,sha256=6tgnBTr1zTs4uJQcwNthofg9QijNvgqTpqfvteIy0es,3562
|
|
90
|
+
crawlo/pipelines/mongo_pipeline.py,sha256=0iSlUlvjO5AsfuE5zHCKjL0YbhHR5OtZjIjvegNzr7c,6213
|
|
91
|
+
crawlo/pipelines/mysql_pipeline.py,sha256=ZCz1YE6OdjCPzhaCcFN2eBk37bxLXrFDZt-ceS93uks,23235
|
|
92
|
+
crawlo/pipelines/pipeline_manager.py,sha256=c1t-YcIspp7o09NEfaYSBSaUUIg2-0fJhjqvG7_3Jqw,4286
|
|
93
|
+
crawlo/pipelines/redis_dedup_pipeline.py,sha256=j_i9Tl3L7tt4Lkc4tLCIcY3tWMEvvVxDH1TYbbqUWzo,5914
|
|
94
|
+
crawlo/queue/__init__.py,sha256=wY-W_KLmjCbMGYUebmOcTh98JO28pTBH-7ifCAaXBXc,259
|
|
95
|
+
crawlo/queue/pqueue.py,sha256=bbgd3l1VfqYXfz-4VFaiWLmJit1LdB3qHalCtNqyrqI,1210
|
|
96
|
+
crawlo/queue/queue_manager.py,sha256=CjaA0C6HMaET2n_osFr2mxO_fzt8Oq9pOqQIPnt63r4,25059
|
|
97
|
+
crawlo/queue/redis_priority_queue.py,sha256=B9QYTczt12kc4QlZSt1_XyvqvefwesOV-rCUPr_KyXo,22471
|
|
98
|
+
crawlo/settings/__init__.py,sha256=NgYFLfk_Bw7h6KSoepJn_lMBSqVbCHebjKxaE3_eMgw,130
|
|
99
|
+
crawlo/settings/default_settings.py,sha256=xTOZAfle2TUVcMkP1m1XAB6MSg-RvCrJp1YvOB8aUEI,13485
|
|
100
|
+
crawlo/settings/setting_manager.py,sha256=yI1tGaludevxKGGZO3Pn4aYofrg2cwYwvMZCFC5PPZw,8595
|
|
101
|
+
crawlo/spider/__init__.py,sha256=91NbcZGUiKOgPpvu8QfsSE6_A2Gw2XQoaiTPxwP-8k8,21855
|
|
102
|
+
crawlo/templates/crawlo.cfg.tmpl,sha256=DfmftICPPsopFGkmOqTWo55PCLboUk5iyFBtGqD_V1g,212
|
|
103
|
+
crawlo/templates/run.py.tmpl,sha256=jr2T6vARwMEJ3v4WXkLH1X0-wDTnoOlJTW-q2255z9o,499
|
|
104
|
+
crawlo/templates/spiders_init.py.tmpl,sha256=QvPw4DxiIjzyue6JDgfFtmuRKrE-jmjlBbvDK10zQwY,109
|
|
105
|
+
crawlo/templates/project/__init__.py.tmpl,sha256=WI5rG7-4rvwmwJWoGCzAgiw4hH2mL6qCYp5GbgiqxJY,54
|
|
106
|
+
crawlo/templates/project/items.py.tmpl,sha256=DrNj48b1W54DmntTLwU--ow2Fw4wSKw8MAmV1K8Vh2E,236
|
|
107
|
+
crawlo/templates/project/middlewares.py.tmpl,sha256=QQlb_bIhurQx4ZOUge3pwHrNIN0Z7RXNXCwA52Hs0Sw,1096
|
|
108
|
+
crawlo/templates/project/pipelines.py.tmpl,sha256=b_c_xLUzxLx3z2rMS0JG4JagM6_s38dx-VDHV47HaLQ,845
|
|
109
|
+
crawlo/templates/project/settings.py.tmpl,sha256=Wcchnbehzg-BY7XCxnrOz-pUwm6PDThN2mp42a-z3iA,3759
|
|
110
|
+
crawlo/templates/project/settings_distributed.py.tmpl,sha256=CpL3TkXkXEk90rNAnQRCTvu8jKlkhOckCin8245bdQM,5514
|
|
111
|
+
crawlo/templates/project/settings_gentle.py.tmpl,sha256=T6tPA91KtmOU_oyosrt-Z5LZ73jT_HWBu2mT0FrRxjg,5840
|
|
112
|
+
crawlo/templates/project/settings_high_performance.py.tmpl,sha256=kTdFI_FF_gzYxxASHiXEtfv2ptOHSD6X5K5VHMxPYJs,5960
|
|
113
|
+
crawlo/templates/project/settings_minimal.py.tmpl,sha256=CE-bGRFs12EY3psa6o-F3HB78nBF_YeuhMbgYN9efN8,3461
|
|
114
|
+
crawlo/templates/project/settings_simple.py.tmpl,sha256=Z5nKJXfKVBgBpp4B5DeuyopMPLOcorJJ4Bu6UG8pams,5692
|
|
115
|
+
crawlo/templates/project/spiders/__init__.py.tmpl,sha256=llhcIItXpm0TlEeumeLwp4fcYv2NHl8Iru7tLhDhxiE,216
|
|
116
|
+
crawlo/templates/spider/spider.py.tmpl,sha256=MpnTd69yawJ11rqyYRApj3_InQf_gMzNqPfL5bF7UgM,887
|
|
117
|
+
crawlo/tools/__init__.py,sha256=fatgJTaA06jvINxsqn7yJ-QtnRpxc2eDLnDFTmE_ykI,1768
|
|
118
|
+
crawlo/tools/date_tools.py,sha256=QOT3W5MqcEQhVM3cTZYxu1MRfgX-TI4aF1RI9s0QbdE,9195
|
|
119
|
+
crawlo/tools/distributed_coordinator.py,sha256=kkRbRoxz7iXKI3AQElyTptDpYl352ErbSkM3wjSHVwU,12574
|
|
120
|
+
crawlo/tools/scenario_adapter.py,sha256=gBe1nQiVO6c9Lt7GkA25zyidX_jaXUHWLjKWBtvXz5A,9658
|
|
121
|
+
crawlo/tools/text_cleaner.py,sha256=UrMGcgRnJaufjmDKIDsRYKMA8znCAArHDgouttWPygk,6690
|
|
122
|
+
crawlo/utils/__init__.py,sha256=FFMqPPGW9oLHDIJoF-ImxHwCLL_CKe5rMmi87CShKMs,1511
|
|
123
|
+
crawlo/utils/batch_processor.py,sha256=yGAS-Gp4ZAUEE1O8DHlSVSG2qEhfa2_nlDiFxIZUfyU,9882
|
|
124
|
+
crawlo/utils/config_manager.py,sha256=Qgrtm1v3rdlm-VMCjJOnllxQAizRu1oU6bGOhX_GEv0,14111
|
|
125
|
+
crawlo/utils/controlled_spider_mixin.py,sha256=U8fmo4aMEghmgoPZ8ZAZFutM-VaMFs33VwFS5rRR1XQ,16934
|
|
126
|
+
crawlo/utils/db_helper.py,sha256=auS7KOBvXolpfO1a6McWHBt1PgcTD6FbkkjNdvdjS7s,8700
|
|
127
|
+
crawlo/utils/encoding_helper.py,sha256=4MjF1Nzllt-kqIqLGp4p415KukouNZbxTOacTEFWi1M,6016
|
|
128
|
+
crawlo/utils/error_handler.py,sha256=Wm4fieywfR4M39v7GR0Tj2WTBcOQ8Mjf6PY5VF8VNTc,16234
|
|
129
|
+
crawlo/utils/fingerprint.py,sha256=3IbctH3zwyBjN_12SH7-vrFt-akA2WSo3iAzHc6u--s,3689
|
|
130
|
+
crawlo/utils/func_tools.py,sha256=y-TYP9H3X67MS_foWy9Z2LIS6GP7Y4Cy3T168ulq3Jc,2451
|
|
131
|
+
crawlo/utils/large_scale_helper.py,sha256=pHu4597lVtycvNwJXbw1IWCF6U7L8pMzWwBSwEZl-Fk,12450
|
|
132
|
+
crawlo/utils/leak_detector.py,sha256=7ycQEpVRglYUdueOzY-Kkt1mQK8nk0wbDRVO9uo4jhw,11922
|
|
133
|
+
crawlo/utils/misc.py,sha256=m_TbfMf4Aoe70zmkv7XWyFg8Rz0qOYPXepwB6EcYr7Y,2519
|
|
134
|
+
crawlo/utils/mongo_connection_pool.py,sha256=CCWsgF82LzQSBBlNJAW2AfWosw13sqOQbGXfKKNoFGk,6046
|
|
135
|
+
crawlo/utils/mysql_connection_pool.py,sha256=xNCGvZV1ytnejPmxISb4uDVqdCeGz4PNXXtpkcBz7yc,7254
|
|
136
|
+
crawlo/utils/performance_monitor.py,sha256=QevfmkIbu0Ox3kd7eiH_IIWiFy1zfNcqOlnBH8OhdLE,9830
|
|
137
|
+
crawlo/utils/queue_helper.py,sha256=gFmkh1jKlIcN1rmo2Jl6vYcLP5ByUWlfHO9eNlZPBLs,4918
|
|
138
|
+
crawlo/utils/redis_checker.py,sha256=XP05VK8dpFYYt8p3eK2tiNskmSCQXJAshuJ-BqsqV-U,2639
|
|
139
|
+
crawlo/utils/redis_connection_pool.py,sha256=DWqcusN6jfFn9YA7kuhVNsLZr4P0bOIFXUaYqTueewQ,21397
|
|
140
|
+
crawlo/utils/redis_key_validator.py,sha256=v7pat8g30MyqQDaXJbDDH4CS8irmu0ijTGZRfm7nh7g,5807
|
|
141
|
+
crawlo/utils/request.py,sha256=mMDo85uEbjLYJ-Np2VT0GMeXD7L8IYY4eIV98lIspYU,9438
|
|
142
|
+
crawlo/utils/request_serializer.py,sha256=zuH2_AhSZDVDmKUo6NrfG6kt4ZsbBict9pUf7CZvaM8,8929
|
|
143
|
+
crawlo/utils/resource_manager.py,sha256=SoZV7Z980HZaDazchUY8fc8J481VGPrgW18bqFzIZAs,11209
|
|
144
|
+
crawlo/utils/response_helper.py,sha256=YJYnK_NYWEIm7iF9rfgU-xB2WvGfJo28MGYRWao-Ghs,3392
|
|
145
|
+
crawlo/utils/selector_helper.py,sha256=kfqgy3ZV0RuGE_I8sNqQemr1XuJYBmM1Hkk7CD61HzU,4314
|
|
146
|
+
crawlo/utils/singleton.py,sha256=oXtNVB1_yTBv1Hvq8_jU_X3eKMKmQ21Kl0G9SS1vcWc,1892
|
|
147
|
+
crawlo/utils/spider_loader.py,sha256=CVyzuVmMFZ02ur8USna3jZNyMrhFUdPKoatnbDkOnSc,7675
|
|
148
|
+
crawlo/utils/text_helper.py,sha256=gYIrkH4_vFHbKZH9m6d1BVO5dqRqUccJqSWMdgVOb4g,2918
|
|
149
|
+
examples/__init__.py,sha256=NkRbV8_S1tb8S2AW6BE2U6P2-eGOPwMR1k0YQAwQpSE,130
|
|
150
|
+
tests/__init__.py,sha256=409aRX8hsPffiZCVjOogtxwhACzBp8G2UTJyUQSxhK0,136
|
|
151
|
+
tests/advanced_tools_example.py,sha256=W_QLm62QJGDSsjTi1ZrTfzrwfakk21PF_iOQvraBc94,7031
|
|
152
|
+
tests/authenticated_proxy_example.py,sha256=ZgLrU-1GaBhkJK1Wy0X93lHP1GT2sU2_wi3RI1CfrVc,3135
|
|
153
|
+
tests/baidu_performance_test.py,sha256=wxdaI7UwKboMYH_qcaqZLxAStvndH60bvKGzD8F-jaI,3974
|
|
154
|
+
tests/baidu_test.py,sha256=NKYnwDbPJX3tmKtRn7uQ_QWzUXiLTQC-Gdr1cQkJzEo,1874
|
|
155
|
+
tests/bug_check_test.py,sha256=EIDOUk_QgtBOWKuBLm_WHbgJ0fsDuJACJ-nuxnBIdkQ,8056
|
|
156
|
+
tests/cleaners_example.py,sha256=blVqSJ7SeWUNd17JjHZJgVTzWH65XKevLyaMB_Wg8qA,5324
|
|
157
|
+
tests/comprehensive_framework_test.py,sha256=_1N-OGbKvBTNachNvIjkL_izr4uv6OUybUkhxxz5MAk,5977
|
|
158
|
+
tests/comprehensive_test.py,sha256=wypCaB56IV8w8nd5VA5LSXUQ3IgLf0AKKUiCci6yEJQ,2969
|
|
159
|
+
tests/comprehensive_testing_summary.md,sha256=S01gclEas5oDhSLjxT_mOoeMl8FE4NMA-gveQOrIS4g,6513
|
|
160
|
+
tests/config_validation_demo.py,sha256=jbZ7h-HGsJmuqBb1euB_AhmKjllkvPmItRF1K0MQrVM,4171
|
|
161
|
+
tests/controlled_spider_example.py,sha256=2SAQKoREGHe-OzVaSkGpopCcrou6QXmeW7rLdmsyopw,7981
|
|
162
|
+
tests/date_tools_example.py,sha256=XI3iFEzeo7Nb5YepK8WHytIaBegtxWVSISpqQgpV6M8,5042
|
|
163
|
+
tests/debug_configure.py,sha256=9VZRJtA0u_SbCC_ZMdsiT9raseRE-C2spZpZuXZNysI,2213
|
|
164
|
+
tests/debug_framework_logger.py,sha256=p-dfOjEipjXQd6yk75S-SMoepzwujiwuv3rNwNSyjow,3413
|
|
165
|
+
tests/debug_log_config.py,sha256=cPS6qOLnynYTFOxpjcy9OUgIqrkasWb9f2c_PASc2_E,3714
|
|
166
|
+
tests/debug_log_levels.py,sha256=CZWG3KGDq-hYJ5TPhoZTyjKFKkkM-AoK3oP1w-JC1sc,2168
|
|
167
|
+
tests/debug_pipelines.py,sha256=FMb36bH9lQxBLb-nM579hBRK1S16Vxu1t_BC3Dj8O2w,2164
|
|
168
|
+
tests/detailed_log_test.py,sha256=oTCFF_Un7Jq2gV4rpRDFOxlHJSthnQhvEf0CSItfB7I,7501
|
|
169
|
+
tests/direct_selector_helper_test.py,sha256=p7_x3x87JUnpKplmwYO4zN5ympcPJSPdHsviso-LmpI,2862
|
|
170
|
+
tests/distributed_dedup_test.py,sha256=EaRnWH3ADsJN67Kn7T5TYPiQyMvyRtV6OCPk1uUTXQM,16507
|
|
171
|
+
tests/distributed_test.py,sha256=u6cEiymZzCItaTClKTxwVjNmOj9_PZii4_eGNAVMDW8,1825
|
|
172
|
+
tests/distributed_test_debug.py,sha256=pUv6ZKEJ5pK9xOA7lgVk6WW3cBAtnb1bsuZzJ8oGLvY,2181
|
|
173
|
+
tests/dynamic_loading_example.py,sha256=7LdeQZFevrb-U1_dgr4oX3aYo2Da4HvE_0KIf1fw4Ew,18786
|
|
174
|
+
tests/dynamic_loading_test.py,sha256=dzDW7b66HeDsIYsYgvNRihE3V6b6gEbUGQpp-eJbcIM,3413
|
|
175
|
+
tests/error_handling_example.py,sha256=grTeo1X17rFz4lhgASb0g5yu4NWbmNz5neyuonnNR40,5294
|
|
176
|
+
tests/explain_mysql_update_behavior.py,sha256=uBrJwiYujTJF35oF1kYMRjYU5k5Y3YlqOfOni0oPQtY,2865
|
|
177
|
+
tests/final_comprehensive_test.py,sha256=szTNbtwKfYNmE0kzDPCsE_kvnTG7FNKl2JERakGhKIk,4314
|
|
178
|
+
tests/final_log_test.py,sha256=CpZ4ZvvuvFiBvz1a50qN599XIU086ett_I0bSX42BLU,9367
|
|
179
|
+
tests/final_validation_test.py,sha256=4cuTr58i46JI6M4Tz54e7vrVFrOr3R7HSWgyQPKmM9M,5244
|
|
180
|
+
tests/fix_log_test.py,sha256=hcRy0j3j0CT0oLN7KNA0VL-_o4M-uE1amR6GziBflfU,4440
|
|
181
|
+
tests/framework_performance_test.py,sha256=Qp47VrsCK0ylEhDkFOm7lnD8rVkaJ7u1MopsEhAomrE,6985
|
|
182
|
+
tests/log_buffering_test.py,sha256=0B5UY1yQuxnBU1pEyz3IBYweN__4fOkPXly-kYfOpNU,3226
|
|
183
|
+
tests/log_generation_timing_test.py,sha256=zHb_m2FqlpRCYw-wqFWFn8cbVH8UR3VvXKSM6nNnbgo,4681
|
|
184
|
+
tests/monitor_redis_dedup.sh,sha256=2nFs5zYiguVqL2YSw_XbhGb30a_EDg0wTIV7zOa0pNg,2284
|
|
185
|
+
tests/optimized_performance_test.py,sha256=bA0dN4j7ViyTSSiCJEjlkJ9Y7jspTFKs2xX7UXHE8Gs,7379
|
|
186
|
+
tests/performance_comparison.py,sha256=UevHOM_9z2ILedf_xZ_8F8QiPjb_M8WTfGQrxzKtgco,9266
|
|
187
|
+
tests/queue_blocking_test.py,sha256=hp-6hmTOO64oOAWVtlN8cFJ95GjbK3t9fj-4q_TKowk,3955
|
|
188
|
+
tests/queue_test.py,sha256=HeBiBXqAgIAbUkLVQ3McS6NdRselA30m3lnuxNBvZbk,2689
|
|
189
|
+
tests/redis_key_validation_demo.py,sha256=WD2jvuBwHhLYIb3lVFtvYSSnmXWn1EW4EPCEwFhfi6M,4467
|
|
190
|
+
tests/request_params_example.py,sha256=J50NdsnK1sDrqG-5m3oA-mu1_wHwVwHIfsWxGeQpz7o,4250
|
|
191
|
+
tests/response_improvements_example.py,sha256=t1cbG3nesp82bqog4_ku1GvQzNbhRyWa5EaKTmOPrSk,5402
|
|
192
|
+
tests/simple_cli_test.py,sha256=t-MyZIk65B3l_JT7Ocf2K3d_bQHBhzzkyx3lvpHw6eU,1594
|
|
193
|
+
tests/simple_command_test.py,sha256=8TowzW45ukKTPeaNC5uij3RR7rqPULiBr2PguSSMdP8,3688
|
|
194
|
+
tests/simple_crawlo_test.py,sha256=FYDn5cgAxHN81QSYa_wcJcxJit7aLnIopnkHKKr83dE,4801
|
|
195
|
+
tests/simple_follow_test.py,sha256=3vNT5Eqwza6fxAY9Xl_9xtFGdfrPwm6NnVHdRmJsH8A,1053
|
|
196
|
+
tests/simple_log_test2.py,sha256=Rn3XerVlkT0M-vbQmrQL7bVIZG3REnJNmMvUvKr6C20,3944
|
|
197
|
+
tests/simple_optimization_test.py,sha256=hflvaC81ra1ZrPOp-Z7rQrH95OnSADvAjy95BLulD6o,3678
|
|
198
|
+
tests/simple_queue_type_test.py,sha256=wAf4XLKl9oS5BlfrRJ1SLY-kYmNq4YY0LdIC7HmW-yg,1193
|
|
199
|
+
tests/simple_response_selector_test.py,sha256=0naeRUX1n-oAW6VRj-12c6nre2D0RjJ0dD3Nx7BBTjY,2844
|
|
200
|
+
tests/simple_selector_helper_test.py,sha256=l9FsVhQ-z-ICqqetLIyeSaI8Dn6bXNCD8sLdr0tpvms,4438
|
|
201
|
+
tests/simple_selector_test.py,sha256=XzOYzpEzr0yaioLV6v-4XC60VZMd5jRthlyp7Ud02o4,6630
|
|
202
|
+
tests/simple_spider_test.py,sha256=RzziJg-fbIVJ6_CgbismfkwrLwpJp4WWp2RLgG7Tpws,1168
|
|
203
|
+
tests/simple_url_test.py,sha256=g9RBn46V7fHZTU0BrB5pl5AGCbw6QuKOXClVACb-MEQ,2297
|
|
204
|
+
tests/simulate_mysql_update_test.py,sha256=7BEFdQkYjgCdLN5vnieTf-ByosCcSj2QJUMOUeYlLgQ,4597
|
|
205
|
+
tests/spider_log_timing_test.py,sha256=pvYpKZemClr4mCR76xywhsiWbT5sPdzD_taZKFjlgvM,5573
|
|
206
|
+
tests/test_advanced_tools.py,sha256=HT_TcwfFzli-CavIJSqQqnCxnBn5FDMX09zL7AJ5tNY,5398
|
|
207
|
+
tests/test_all_commands.py,sha256=VgVa9SzU5Irvn5igHpC2W4E_6ZDWDt7jc-T4UPK_PFE,7718
|
|
208
|
+
tests/test_all_pipeline_fingerprints.py,sha256=NDrBYr0f9CAhjmSezTS4NUrAdcotrSX3ElJTWqjXXbU,5308
|
|
209
|
+
tests/test_all_redis_key_configs.py,sha256=dWc4Dsr07_vuSpb4hwkMpyy6XO8SI7vglVjGuGvXoa4,5710
|
|
210
|
+
tests/test_asyncmy_usage.py,sha256=gxENdxrcLlDG2m8V-j4ZnSJYFc3x6CvKvgPAhOC13DE,1688
|
|
211
|
+
tests/test_batch_processor.py,sha256=4_nYlu9R1JkDCFHq0bYc9LUNqsg41r7sQ879hkrhEts,7212
|
|
212
|
+
tests/test_cleaners.py,sha256=HDK8_YU7GUj_3hGU415cxEeUR74mnDSk0yroLlgDI0I,1816
|
|
213
|
+
tests/test_cli_arguments.py,sha256=_wNtGNLnrrw3zVyickLcI9qI6ncjms_8AH0IrCNWk4U,5443
|
|
214
|
+
tests/test_component_factory.py,sha256=V3hO5pJHSDtViLAykXSUqkeH4g-GB4GczwutrTatS2U,5809
|
|
215
|
+
tests/test_config_consistency.py,sha256=RgSxyaypMpysltsGSh1vFMeOShiZZG0rmUKzEhNLpYw,2001
|
|
216
|
+
tests/test_config_merge.py,sha256=ts1j-TIKkFS0EO5q1I4O7f4YUKR5MLTmRSqOpOlv094,5606
|
|
217
|
+
tests/test_config_validator.py,sha256=Z4gBHkI0_fEx-xgiiG4T33F4BAuePuF81obpNTXfseY,6202
|
|
218
|
+
tests/test_controlled_spider_mixin.py,sha256=AQ493ic6AxZAKd7QCgnUES92BBWCMNteTd5DjoQlhwo,2864
|
|
219
|
+
tests/test_crawler_process_import.py,sha256=iIPqSCpv2VRb_hWTu5euLME4PDFf7NwixeBypRuv39Y,1175
|
|
220
|
+
tests/test_crawler_process_spider_modules.py,sha256=uMr4esj6ascVBzt0WrPd3ZOQfKD00O6tJrNhuWOdvV0,1395
|
|
221
|
+
tests/test_crawlo_proxy_integration.py,sha256=JFBI82ILXMwAIJ29C8uhu5r-hH3UhMC50jKr5-jy6Ng,3059
|
|
222
|
+
tests/test_date_tools.py,sha256=pcLDyhLrZ_jh-PhPm4CvLZEgNeH9kLMPKN5zacHwuWM,4053
|
|
223
|
+
tests/test_dedup_fix.py,sha256=6gQKDatida54itwPtB1-HwUTKbdwwJA2Yc-HhhHj_wM,8747
|
|
224
|
+
tests/test_dedup_pipeline_consistency.py,sha256=dn5EAZSU5gQOV5EQwreHp76i5aQZ9tEdltSGO7dif5M,5176
|
|
225
|
+
tests/test_default_header_middleware.py,sha256=UDjEPIUCre1M6ndjV_uXLVCfY7WJwyN-1Xn15hzbKMo,13126
|
|
226
|
+
tests/test_distributed.py,sha256=78Pn4HPLIaO8t1IiaSkckBmuEVTcnC8IDw7znf9_Zcw,1790
|
|
227
|
+
tests/test_double_crawlo_fix.py,sha256=lZwrT5ij6Jbh0EzZswhw05FXwgKaEZsSHekLTrJJajg,7856
|
|
228
|
+
tests/test_double_crawlo_fix_simple.py,sha256=NDmCEeyvpf_D1tGQMA66iLPPKlAnSZcEg71e7GHYcjg,4768
|
|
229
|
+
tests/test_download_delay_middleware.py,sha256=Idc6KzhL3hY3aDKgn1j_v5-mLIHz7dTnV5c4tJVZh5Q,9107
|
|
230
|
+
tests/test_downloader_proxy_compatibility.py,sha256=NJJ-g_I665lHLsJZd7ONvKubHRxv82FADZR9WYzgyzA,9418
|
|
231
|
+
tests/test_edge_cases.py,sha256=460JtYR6yuTo8J4wqJScMzDkrrDUE2Q8R425AaUycIQ,11127
|
|
232
|
+
tests/test_encoding_core.py,sha256=k5fZET0R1KInhAlbbHEJv4m9d6NuibOxxfIcR43TS7Y,1681
|
|
233
|
+
tests/test_encoding_detection.py,sha256=Zb1KkF2CR57qa0Hr_Iv8msompGJZT2EIL_2mGp0zX9Q,4245
|
|
234
|
+
tests/test_enhanced_error_handler.py,sha256=Ku_86jv7iDe25v8ZxalcXxJJjIiIvQXWH8ZldbwdVm8,8581
|
|
235
|
+
tests/test_enhanced_error_handler_comprehensive.py,sha256=j_cxyIPGks9A3untKhAdj5HU0hrLbbzOLu0uAtGUlJo,9369
|
|
236
|
+
tests/test_error_handler_compatibility.py,sha256=xJ43cmCwfBGh-qBwCGiMDPPlfNDLw4ZrmlrHN9IojkU,4241
|
|
237
|
+
tests/test_factories.py,sha256=wKFfr8YBXPs-AQ8YOFgDhINn5uivKqPBZQPUe5GL9Ig,8865
|
|
238
|
+
tests/test_factory_compatibility.py,sha256=zzTXd3ku3iedgxgB1DxTt3zfetiIl6wCjL9yXIUCpic,6260
|
|
239
|
+
tests/test_final_validation.py,sha256=OuZI01O0E68Pao--bD-BFDTRZFPc_Mt4W-OXUzlt6ZA,4966
|
|
240
|
+
tests/test_fingerprint_consistency.py,sha256=68V5u_2hNABI5pNWzXUrA1PJ08Xh9x3-JsMSNNjORMo,4956
|
|
241
|
+
tests/test_fingerprint_simple.py,sha256=qiSba8gF3Zl91QO_ijJO7KstLdjATs30V_GZCNHShig,1626
|
|
242
|
+
tests/test_get_component_logger.py,sha256=UKj5uT1F3L3atoJFmpk7QSDO2fZHgw-7Y84vMFbHRkM,2285
|
|
243
|
+
tests/test_hash_performance.py,sha256=4eVPwbu66Oun0LVyTTNd9d2cj2V1xq0YZkRg8Z0TO-Q,3211
|
|
244
|
+
tests/test_integration.py,sha256=lVEzKNAjFzFZHRNZAyJmXxa_5Ogf_qqL4APqs620o58,4839
|
|
245
|
+
tests/test_item_dedup_redis_key.py,sha256=dp_H59exJLaZHh5oMtmMEOWh-DNZwbnwIFYDjOpHgd0,3842
|
|
246
|
+
tests/test_large_scale_helper.py,sha256=0L6EKHcKgh7XHvoW4wRSkxmw8GolUwSOCgZ_-ZmCyDo,8371
|
|
247
|
+
tests/test_logging_enhancements.py,sha256=YHcYWC8PG_AP5wZnmOr6H7QuU7m-3xzxEhppM0Jubvg,12731
|
|
248
|
+
tests/test_logging_final.py,sha256=K9vxyODslXza05hElVEcvzbXgzthYKK5CRj4UJTftIw,6376
|
|
249
|
+
tests/test_logging_integration.py,sha256=5WpExyt6BmYBZwrjqtQIGOw1Id64opJBAIahDk70Mlc,11131
|
|
250
|
+
tests/test_logging_system.py,sha256=LGfK14ZEWzRtl3_VkBGz-AaVa_dDtuC5zu40m8FvmMo,9206
|
|
251
|
+
tests/test_middleware_debug.py,sha256=gtiaWCxBSTcaNkdqXirM7CsThr_HfiCueBdQCpp7rqg,4572
|
|
252
|
+
tests/test_mode_consistency.py,sha256=t72WX0etC_AayaL2AT6e2lIgbfP-zxTgYAiTARSN2Jk,1276
|
|
253
|
+
tests/test_multi_directory.py,sha256=sH9Y3B-fuESlc7J1aICa-AlBcCW8HFR-Q5j2anUr8l0,2196
|
|
254
|
+
tests/test_multiple_spider_modules.py,sha256=M0wPyQW7HMasbMIgn_R78wjZEj4A_DgqaGHp0qF9Y0c,2567
|
|
255
|
+
tests/test_mysql_pipeline_config.py,sha256=5Yveo4cPiGOG22EO5493QkC2m3ocKfv0Y2jK9m_4aZU,6793
|
|
256
|
+
tests/test_mysql_pipeline_error.py,sha256=htqZBnEIF3kIML53u8Sv4_PnyRep-0JJFApuD8FpkFQ,3529
|
|
257
|
+
tests/test_mysql_pipeline_init_log.py,sha256=-x9M2wqfa5g3jZ-y7iIPIOqEle0HouC28YECWfSE5OQ,2516
|
|
258
|
+
tests/test_mysql_pipeline_integration.py,sha256=fhBwU0ewH3nc1ol1JH4xpVTGrqlIttBghkqtxtOgMF0,4208
|
|
259
|
+
tests/test_mysql_pipeline_refactor.py,sha256=yJzBBgoIavQjXWQtivP0j8kAwmbb8zybypHqdLbfd_c,5804
|
|
260
|
+
tests/test_mysql_pipeline_refactor_simple.py,sha256=QmF2Zv-0FyWMs6SYNXQPC3GW1rVyPnKmM_2rGOtxCps,3724
|
|
261
|
+
tests/test_mysql_pipeline_robustness.py,sha256=cmjDOv9FX1OAFHJaY3WkveCSOTZiiZKu5ehjHaI-QW0,6138
|
|
262
|
+
tests/test_mysql_pipeline_types.py,sha256=dIs4aYlV9vsGfhvmDHOc-LCx-jDqUzoAkn-v8i2ae7Y,2474
|
|
263
|
+
tests/test_mysql_update_columns.py,sha256=CyEshc7b_yprIXcQtNOaWvCC2ZDb0kzjLOfmd8r3sOY,3458
|
|
264
|
+
tests/test_offsite_middleware.py,sha256=njpXTdngOqBs60Wj6xgo5EEXlJnMHd7vtYGi9dVauW0,10602
|
|
265
|
+
tests/test_offsite_middleware_simple.py,sha256=4MfDKSXGHcoFLYnnxCH2rmnzztWyN0xByYLoHtepyiA,7918
|
|
266
|
+
tests/test_optimized_selector_naming.py,sha256=fbmlB5S2kBwtQWpWoQ4lQ7rUQm2_DeWK-t6KqvIRTUQ,2787
|
|
267
|
+
tests/test_parsel.py,sha256=wuZqRFIm9xx1tt6o3Xi_OjvwhT_MPmHiUEj2ax06zlo,701
|
|
268
|
+
tests/test_performance.py,sha256=Lqs2iu3dmWipZkBPARcwIjDLXsqe42ntz1M4RzqqXKo,11457
|
|
269
|
+
tests/test_performance_monitor.py,sha256=paW3HGg6ReHb9lwnOivGCrI8STwbwp_mbuhgfds1h3I,4187
|
|
270
|
+
tests/test_pipeline_fingerprint_consistency.py,sha256=LL55oGSDGy0K8LxoyKa6ogNHXhJlZHe509vCFbibLkk,2847
|
|
271
|
+
tests/test_priority_behavior.py,sha256=JQ5uv80cAUKV9Eh3S8j5zxYSSL-dmzhwhuKOINM26zU,9325
|
|
272
|
+
tests/test_priority_consistency.py,sha256=rVX7nku5N_QpB_ffDu3xqREkCWPX5aNNiXy112o9wpA,5756
|
|
273
|
+
tests/test_priority_consistency_fixed.py,sha256=MlYi5PIr5wxunC3Ku4ilnxOatKyRu2qIvhV7pjadkjg,10765
|
|
274
|
+
tests/test_proxy_health_check.py,sha256=_tDlxa_6TdL3M5RLkHF82roXJ8WIuG5hELBp2GADyKQ,1123
|
|
275
|
+
tests/test_proxy_middleware.py,sha256=MC2Hg88Pdpv6i_gTAy4ocIWOOxQ8bF7hYtszwpOzilE,8716
|
|
276
|
+
tests/test_proxy_middleware_enhanced.py,sha256=N7Ly3koCH2uRYk6pxhEJwWpChKdIucdrj0nKvq_E4bw,6896
|
|
277
|
+
tests/test_proxy_middleware_integration.py,sha256=PQhJKM1uGtQTlBh7XlKWAMwNwQ6K8of-P15KHDF2dJg,4729
|
|
278
|
+
tests/test_proxy_middleware_refactored.py,sha256=Z4szCDqyjAwWtgDoddgfeNIVsVefPcrfsZP57gCMrJQ,8272
|
|
279
|
+
tests/test_proxy_only.py,sha256=OqF3An_s9VY4mfLX7kDRz_LMtLpNzC6LS2kQkEyiBRw,2563
|
|
280
|
+
tests/test_proxy_providers.py,sha256=u_R2fhab90vqvQEaOAztpAOe9tJXvUMIdoDxmStmXJ4,1749
|
|
281
|
+
tests/test_proxy_stats.py,sha256=ES00CEoDITYPFBGPk8pecFzD3ItYIv6NSpcqNd8-kvo,526
|
|
282
|
+
tests/test_proxy_strategies.py,sha256=9Z1pXmTNyw-eIhGXlf2abZbJx6igLohYq-_3hldQ5uE,1868
|
|
283
|
+
tests/test_proxy_with_downloader.py,sha256=6OqyLcIM9nPMhL9bCYUIeSvYValKPw72XC-Up8jRri8,4597
|
|
284
|
+
tests/test_queue_empty_check.py,sha256=ZJC6jOgZq0Wb0-ubrB1ZNcCaUiWeCxoNZmjkd6PY6t0,1182
|
|
285
|
+
tests/test_queue_manager_double_crawlo.py,sha256=MijZ3JuyHMuqGbRC-8kclFr-4O7m_T8CqezP4qiWk-E,6957
|
|
286
|
+
tests/test_queue_manager_redis_key.py,sha256=txHLq5XUZZN7h9HUlqlUCEVCTe2IXdf9r7F_P2zNVdY,7117
|
|
287
|
+
tests/test_queue_naming.py,sha256=GzPqxvATF9A5iQMgn2wQM68qTHTbsQ9dPhktAkyzDG4,4786
|
|
288
|
+
tests/test_queue_type.py,sha256=N8y3s0Cwco-XphRcIiR4bQuNAEOgmxvlRoR1jzghTtY,3304
|
|
289
|
+
tests/test_queue_type_redis_config_consistency.py,sha256=1ew7Zp9CxH1DQ0RUmsZMV-n7s8B5dCly6u3FkJbR1qE,5259
|
|
290
|
+
tests/test_random_headers_default.py,sha256=ulDb3_kRpnTCN1-TO3m6wVM-eMkZS_ezsSbd1ur8Xpg,12772
|
|
291
|
+
tests/test_random_headers_necessity.py,sha256=SSbNQIE347oCQvuG6yaAambFU-3MyQzTV5jN1kArRGY,11741
|
|
292
|
+
tests/test_random_user_agent.py,sha256=6HjU4iUcMk-J6bR2N5FhIkWDfnaFKAPNVyRzxmQQ14k,2302
|
|
293
|
+
tests/test_redis_config.py,sha256=51_Fy1PqIhS0MMO2nR4q6oQjBFxfqcUPK_4NNf5s83g,903
|
|
294
|
+
tests/test_redis_connection_pool.py,sha256=pKfXdE3Cm_L_fNqI9zqFmqiidCwR0t7hiM_Fu_V1cNI,9328
|
|
295
|
+
tests/test_redis_key_naming.py,sha256=MTFk656JhiGVTsMctBDhBNOMFcBDZrsQA3UfPZ-Dgj4,6911
|
|
296
|
+
tests/test_redis_key_validator.py,sha256=GszSzGADgk3uN6Bye1d8pS-AtMVgB8jwqW-22gPNM6M,4418
|
|
297
|
+
tests/test_redis_queue.py,sha256=WQV3MtGg8rJzHgC2kRfXM6lSMXpwXJVQZfqn2dVrhg0,6758
|
|
298
|
+
tests/test_redis_queue_name_fix.py,sha256=9V-qDmUz97wOdPv8pKcVnQRxeZ126WSdB5JBnow4ho8,5770
|
|
299
|
+
tests/test_redis_queue_type_fallback.py,sha256=Bg6b5bqt-TKotE_wWdkaZNQr2WXT8gaDfolv8785NyE,4692
|
|
300
|
+
tests/test_request_ignore_middleware.py,sha256=QN81wgG_W_XfXCF9LvJNxCNwbOH6_tZnLIwLDTK2K5Q,6229
|
|
301
|
+
tests/test_request_params.py,sha256=l2etiDebqylPBym1e9DSDn4wxwTHv8DQHKq9AzlzlG0,4287
|
|
302
|
+
tests/test_request_serialization.py,sha256=Ikgec8tt_sPCK6jcZyK8vRw84zRNE6nxQy9rba1WKmE,2332
|
|
303
|
+
tests/test_response_code_middleware.py,sha256=wSe525bm-bk_iWMjPDzUu1LfOQrwJY8_MLKAspq2dzk,12193
|
|
304
|
+
tests/test_response_filter_middleware.py,sha256=YWrGzJ7wmftTjJXcNTtJl3b3EdJsO4oR22ZLWwgErhg,16327
|
|
305
|
+
tests/test_response_follow.py,sha256=gjVZ_knsuHUaCDOjRPk-qG9HRCwReXlVrIx_KpveRHM,3738
|
|
306
|
+
tests/test_response_improvements.py,sha256=vNqHKyoEoYeEGAUiRzdsff2V6yvJ9QnDwGg7gmN38Ow,6028
|
|
307
|
+
tests/test_response_selector_methods.py,sha256=6aS7q_PBx601MnXbCze-ZWNO-uCKFVjhxcCg9NJqKrI,2738
|
|
308
|
+
tests/test_response_url_methods.py,sha256=plOpSN3JLRI8-lbj4cva8-_jRFdDwmax9Gkv6O2Ac-s,2759
|
|
309
|
+
tests/test_response_urljoin.py,sha256=uXTWhFx8-XBb-Vaghn9YKJz5ThkwRuNykBWW4S7f3go,3379
|
|
310
|
+
tests/test_retry_middleware.py,sha256=mi7s4HDAqmmd9nvyxs3ZgxdEKOYkCgDu3rDvU_9o8vQ,11133
|
|
311
|
+
tests/test_retry_middleware_realistic.py,sha256=Sam5y4jCN8oeElU4xxeS5zjAyzS-P8siPV7OaifgsyU,9679
|
|
312
|
+
tests/test_scheduler.py,sha256=1fCu35QgK5gzgrhD0aUZj5lxL0QbokzPav-yEJxz9Ig,8182
|
|
313
|
+
tests/test_scheduler_config_update.py,sha256=LuxjEbt20QrPyVkjSFxvTnFtUxwMaHB6TcqjFyo8bow,4261
|
|
314
|
+
tests/test_scrapy_style_encoding.py,sha256=2K_0lHsYqop4qb5lO1U8g7hbae4nkMPrbEvVTl5TT9Y,3408
|
|
315
|
+
tests/test_selector_helper.py,sha256=-fw8p-uJixTKso7OLUBTVJ2oOjL8LIJA1WDetzthGO0,2818
|
|
316
|
+
tests/test_selector_optimizations.py,sha256=5t5RrDkcy0YtK2Es9DBfi3Cejfv6yV4dagulIQhmEho,4665
|
|
317
|
+
tests/test_simple_response.py,sha256=_ui2PuVZvJcAuLY7HZ8xcsy_tDBimgBqX0ukj3kE5J0,1549
|
|
318
|
+
tests/test_spider_loader.py,sha256=-myi78LztwABeaCpJj-DzO2CxNEYW8lavtVuUreoHcI,1314
|
|
319
|
+
tests/test_spider_loader_comprehensive.py,sha256=gp6SWrDQcrg4RFNkLJQWDQ16NDfpdOlg0rCyJ86-F-8,2591
|
|
320
|
+
tests/test_spider_modules.py,sha256=wxPs28FtpGnQTemMY6r7WxVrwYo3bHnAd5dq94qj1K4,2797
|
|
321
|
+
tests/test_telecom_spider_redis_key.py,sha256=c-gfixPul2VlYMQJGf0H5ZgYJ461fQgSKbCPrbAU45M,7625
|
|
322
|
+
tests/test_template_content.py,sha256=2RgCdOA3pMUSOqC_JbTGeW7KonbTqJ0ySYJNWegU-v0,2903
|
|
323
|
+
tests/test_template_redis_key.py,sha256=99-s0_-8MFJbIvGG_X__sH0qkXWTtJv8fdTdlftsq4I,4876
|
|
324
|
+
tests/test_tools.py,sha256=z50Bvq_q8FwpyxNkmh00_A3sXkSv2l1Q_EbK02FDYgk,5504
|
|
325
|
+
tests/test_user_agent_randomness.py,sha256=tE8_zh-BjMAQ9CTgScxZze6JarNher6COkdoLU68YfA,5681
|
|
326
|
+
tests/test_user_agents.py,sha256=e4haX-o8Janl-PawGJ9MemZyMqTX33_tBF_WnYSVoUw,3327
|
|
327
|
+
tests/untested_features_report.md,sha256=31aUlsw_1OKe0_ijAjeH85kJ7HJ8qzKLJdOHDjWtYdY,4169
|
|
328
|
+
tests/verify_debug.py,sha256=iQ4Efwg9bQTHscr73VYAAZ8rBIe1u6mQfeaEK5YgneY,1564
|
|
329
|
+
tests/verify_distributed.py,sha256=0IolM4ymuPOz_uTfHSWFO3Vxzp7Lo6i0zhSbzJhHFtI,4045
|
|
330
|
+
tests/verify_log_fix.py,sha256=7reyVl3MXTDASyChgU5BAYuzuxvFjSLG9HywAHso0qg,4336
|
|
331
|
+
tests/verify_mysql_warnings.py,sha256=TMPsB1yp7R_c3S6LllgPJ-n_4He6gHVygAC81zbeQrc,4106
|
|
332
|
+
tests/ofweek_scrapy/scrapy.cfg,sha256=D_8rsW65iTbH7nG1kI25jYTCpoQKBVa2shajrsC6fBw,280
|
|
333
|
+
tests/ofweek_scrapy/ofweek_scrapy/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
334
|
+
tests/ofweek_scrapy/ofweek_scrapy/items.py,sha256=Y_TwwHPAgOXTuCTdnhRxil7vYPk1_rzj1ZatTq4AX-I,280
|
|
335
|
+
tests/ofweek_scrapy/ofweek_scrapy/middlewares.py,sha256=O4jVSXZgxtsRzU9O_O3YdkS7_QLndzv3uYP-Op8g254,3654
|
|
336
|
+
tests/ofweek_scrapy/ofweek_scrapy/pipelines.py,sha256=ZO6WqTqPpTwLvnwO7YL0E35OPp4zSfJ_GhMeshNRSow,379
|
|
337
|
+
tests/ofweek_scrapy/ofweek_scrapy/settings.py,sha256=X3Y6goZluAz0n2bepWAKEhZX0URFfe9_lBRBCPgtLPk,2933
|
|
338
|
+
tests/ofweek_scrapy/ofweek_scrapy/spiders/__init__.py,sha256=a-Jax6MTMZC2HOw3mUBcNu-T44dOUHDsb22Oly4HTnM,165
|
|
339
|
+
tests/scrapy_comparison/ofweek_scrapy.py,sha256=rhVds_WjYum1bLuWWe90HtXE51fZXEqhhPSc822ZasQ,5790
|
|
340
|
+
tests/scrapy_comparison/scrapy_test.py,sha256=-IsGUHPBgEL0TmXjeLZl-TUA01B7Dsc2nRo4JZbFwZA,5599
|
|
341
|
+
tests/test_spiders/__init__.py,sha256=Ws2DhfUA0Xh5Cxr9M46td7B6hyNoLTyAhZ60FnIh6D0,20
|
|
342
|
+
tests/test_spiders/test_spider.py,sha256=kNGEg80HMMFgzVseI1jJjljZEBy3QYKt_3SXGASffFM,168
|
|
343
|
+
crawlo-1.4.8.dist-info/METADATA,sha256=-3vWrJ0Mpd-DMRD4S0bRZwzUuKF17FyauuSI78eD7fo,24526
|
|
344
|
+
crawlo-1.4.8.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
|
345
|
+
crawlo-1.4.8.dist-info/entry_points.txt,sha256=5HoVoTSPxI8SCa5B7pQYxLSrkOdiunyO9tqNsLMv52g,43
|
|
346
|
+
crawlo-1.4.8.dist-info/top_level.txt,sha256=keG_67pbZ_wZL2dmDRA9RMaNHTaV_x_oxZ9DKNgwvR0,22
|
|
347
|
+
crawlo-1.4.8.dist-info/RECORD,,
|
examples/__init__.py
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
|
-
#!/usr/bin/python
|
|
2
|
-
# -*- coding:UTF-8 -*-
|
|
3
|
-
"""
|
|
4
|
-
# @Time : 2025-02-05 12:36
|
|
5
|
-
# @Author : oscar
|
|
6
|
-
# @Desc : None
|
|
7
|
-
"""
|
|
1
|
+
#!/usr/bin/python
|
|
2
|
+
# -*- coding:UTF-8 -*-
|
|
3
|
+
"""
|
|
4
|
+
# @Time : 2025-02-05 12:36
|
|
5
|
+
# @Author : oscar
|
|
6
|
+
# @Desc : None
|
|
7
|
+
"""
|
tests/__init__.py
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
|
-
#!/usr/bin/python
|
|
2
|
-
# -*- coding:UTF-8 -*-
|
|
3
|
-
"""
|
|
4
|
-
# @Time : 2025-08-24 12:36
|
|
5
|
-
# @Author : crawl-coder
|
|
6
|
-
# @Desc : None
|
|
7
|
-
"""
|
|
1
|
+
#!/usr/bin/python
|
|
2
|
+
# -*- coding:UTF-8 -*-
|
|
3
|
+
"""
|
|
4
|
+
# @Time : 2025-08-24 12:36
|
|
5
|
+
# @Author : crawl-coder
|
|
6
|
+
# @Desc : None
|
|
7
|
+
"""
|