crawlo 1.0.6__tar.gz → 1.0.7__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of crawlo might be problematic. Click here for more details.

Files changed (103)
  1. {crawlo-1.0.6/crawlo.egg-info → crawlo-1.0.7}/PKG-INFO +1 -1
  2. crawlo-1.0.7/crawlo/__version__.py +1 -0
  3. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/items/__init__.py +2 -1
  4. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/items/base.py +1 -10
  5. {crawlo-1.0.6 → crawlo-1.0.7/crawlo.egg-info}/PKG-INFO +1 -1
  6. crawlo-1.0.6/crawlo/__version__.py +0 -1
  7. {crawlo-1.0.6 → crawlo-1.0.7}/LICENSE +0 -0
  8. {crawlo-1.0.6 → crawlo-1.0.7}/MANIFEST.in +0 -0
  9. {crawlo-1.0.6 → crawlo-1.0.7}/README.md +0 -0
  10. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/__init__.py +0 -0
  11. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/cli.py +0 -0
  12. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/commands/__init__.py +0 -0
  13. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/commands/genspider.py +0 -0
  14. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/commands/run.py +0 -0
  15. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/commands/startproject.py +0 -0
  16. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/core/__init__.py +0 -0
  17. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/core/engine.py +0 -0
  18. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/core/processor.py +0 -0
  19. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/core/scheduler.py +0 -0
  20. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/crawler.py +0 -0
  21. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/downloader/__init__.py +0 -0
  22. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/downloader/aiohttp_downloader.py +0 -0
  23. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/downloader/cffi_downloader.py +0 -0
  24. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/downloader/httpx_downloader.py +0 -0
  25. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/event.py +0 -0
  26. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/exceptions.py +0 -0
  27. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/extension/__init__.py +0 -0
  28. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/extension/log_interval.py +0 -0
  29. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/extension/log_stats.py +0 -0
  30. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/extension/logging_extension.py +0 -0
  31. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/filters/__init__.py +0 -0
  32. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/filters/aioredis_filter.py +0 -0
  33. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/filters/memory_filter.py +0 -0
  34. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/items/fields.py +0 -0
  35. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/items/items.py +0 -0
  36. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/middleware/__init__.py +0 -0
  37. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/middleware/default_header.py +0 -0
  38. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/middleware/download_delay.py +0 -0
  39. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/middleware/middleware_manager.py +0 -0
  40. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/middleware/proxy.py +0 -0
  41. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/middleware/request_ignore.py +0 -0
  42. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/middleware/response_code.py +0 -0
  43. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/middleware/response_filter.py +0 -0
  44. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/middleware/retry.py +0 -0
  45. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/network/__init__.py +0 -0
  46. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/network/request.py +0 -0
  47. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/network/response.py +0 -0
  48. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/pipelines/__init__.py +0 -0
  49. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/pipelines/console_pipeline.py +0 -0
  50. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/pipelines/mongo_pipeline.py +0 -0
  51. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/pipelines/mysql_batch_pipline.py +0 -0
  52. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/pipelines/mysql_pipeline.py +0 -0
  53. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/pipelines/pipeline_manager.py +0 -0
  54. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/settings/__init__.py +0 -0
  55. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/settings/default_settings.py +0 -0
  56. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/settings/setting_manager.py +0 -0
  57. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/spider/__init__.py +0 -0
  58. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/stats_collector.py +0 -0
  59. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/subscriber.py +0 -0
  60. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/task_manager.py +0 -0
  61. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/templates/crawlo.cfg.tmpl +0 -0
  62. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/templates/project/__init__.py.tmpl +0 -0
  63. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/templates/project/items.py.tmpl +0 -0
  64. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/templates/project/middlewares.py.tmpl +0 -0
  65. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/templates/project/pipelines.py.tmpl +0 -0
  66. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/templates/project/settings.py.tmpl +0 -0
  67. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/templates/project/spiders/__init__.py.tmpl +0 -0
  68. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/templates/spider/spider.py.tmpl +0 -0
  69. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/utils/__init__.py +0 -0
  70. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/utils/concurrency_manager.py +0 -0
  71. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/utils/date_tools.py +0 -0
  72. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/utils/db_helper.py +0 -0
  73. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/utils/func_tools.py +0 -0
  74. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/utils/log.py +0 -0
  75. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/utils/pqueue.py +0 -0
  76. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/utils/project.py +0 -0
  77. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/utils/request.py +0 -0
  78. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/utils/spider_loader.py +0 -0
  79. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/utils/system.py +0 -0
  80. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/utils/tools.py +0 -0
  81. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo/utils/url.py +0 -0
  82. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo.egg-info/SOURCES.txt +0 -0
  83. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo.egg-info/dependency_links.txt +0 -0
  84. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo.egg-info/entry_points.txt +0 -0
  85. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo.egg-info/requires.txt +0 -0
  86. {crawlo-1.0.6 → crawlo-1.0.7}/crawlo.egg-info/top_level.txt +0 -0
  87. {crawlo-1.0.6 → crawlo-1.0.7}/examples/__init__.py +0 -0
  88. {crawlo-1.0.6 → crawlo-1.0.7}/examples/gxb/__init__.py +0 -0
  89. {crawlo-1.0.6 → crawlo-1.0.7}/examples/gxb/items.py +0 -0
  90. {crawlo-1.0.6 → crawlo-1.0.7}/examples/gxb/run.py +0 -0
  91. {crawlo-1.0.6 → crawlo-1.0.7}/examples/gxb/settings.py +0 -0
  92. {crawlo-1.0.6 → crawlo-1.0.7}/examples/gxb/spider/__init__.py +0 -0
  93. {crawlo-1.0.6 → crawlo-1.0.7}/examples/gxb/spider/miit_spider.py +0 -0
  94. {crawlo-1.0.6 → crawlo-1.0.7}/examples/gxb/spider/telecom_device.py +0 -0
  95. {crawlo-1.0.6 → crawlo-1.0.7}/pyproject.toml +0 -0
  96. {crawlo-1.0.6 → crawlo-1.0.7}/requirements.txt +0 -0
  97. {crawlo-1.0.6 → crawlo-1.0.7}/setup.cfg +0 -0
  98. {crawlo-1.0.6 → crawlo-1.0.7}/tests/__init__.py +0 -0
  99. {crawlo-1.0.6 → crawlo-1.0.7}/tests/test_proxy_health_check.py +0 -0
  100. {crawlo-1.0.6 → crawlo-1.0.7}/tests/test_proxy_middleware_integration.py +0 -0
  101. {crawlo-1.0.6 → crawlo-1.0.7}/tests/test_proxy_providers.py +0 -0
  102. {crawlo-1.0.6 → crawlo-1.0.7}/tests/test_proxy_stats.py +0 -0
  103. {crawlo-1.0.6 → crawlo-1.0.7}/tests/test_proxy_strategies.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: crawlo
3
- Version: 1.0.6
3
+ Version: 1.0.7
4
4
  Summary: Crawlo 是一款基于异步IO的高性能Python爬虫框架,支持分布式抓取。
5
5
  Home-page: https://github.com/crawl-coder/Crawlo.git
6
6
  Author: crawl-coder
@@ -0,0 +1 @@
1
+ __version__ = "1.0.7"
@@ -5,9 +5,10 @@ crawlo.items 包
5
5
  ===============
6
6
  提供 Item 和 Field 类用于数据定义和验证。
7
7
  """
8
- from .fields import Field
9
8
  from .items import Item
9
+ from .fields import Field
10
10
  from .base import ItemMeta
11
+
11
12
  from crawlo.exceptions import ItemInitError, ItemAttributeError
12
13
 
13
14
  __all__ = [
@@ -4,28 +4,19 @@
4
4
  基础元类定义
5
5
  """
6
6
  from abc import ABCMeta
7
-
8
- from crawlo.items import Field
9
-
7
+ from .fields import Field
10
8
 
11
9
  class ItemMeta(ABCMeta):
12
- """
13
- 元类,用于自动收集 Item 类中的 Field 定义
14
- """
15
-
16
10
  def __new__(mcs, name, bases, attrs):
17
11
  fields = {}
18
12
  cls_attrs = {}
19
13
 
20
- # 收集所有 Field 实例
21
14
  for attr_name, attr_value in attrs.items():
22
15
  if isinstance(attr_value, Field):
23
16
  fields[attr_name] = attr_value
24
17
  else:
25
18
  cls_attrs[attr_name] = attr_value
26
19
 
27
- # 创建类实例
28
20
  cls_instance = super().__new__(mcs, name, bases, cls_attrs)
29
21
  cls_instance.FIELDS = fields
30
-
31
22
  return cls_instance
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: crawlo
3
- Version: 1.0.6
3
+ Version: 1.0.7
4
4
  Summary: Crawlo 是一款基于异步IO的高性能Python爬虫框架,支持分布式抓取。
5
5
  Home-page: https://github.com/crawl-coder/Crawlo.git
6
6
  Author: crawl-coder
@@ -1 +0,0 @@
1
- __version__ = "1.0.6"
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes