cobweb-launcher 1.1.14__tar.gz → 1.1.16__tar.gz

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of cobweb-launcher might be problematic. Click here for more details.

Files changed (37)
  1. {cobweb-launcher-1.1.14/cobweb_launcher.egg-info → cobweb-launcher-1.1.16}/PKG-INFO +1 -1
  2. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb/crawlers/base_crawler.py +20 -21
  3. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16/cobweb_launcher.egg-info}/PKG-INFO +1 -1
  4. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/setup.py +1 -1
  5. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/LICENSE +0 -0
  6. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/README.md +0 -0
  7. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb/__init__.py +0 -0
  8. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb/base/__init__.py +0 -0
  9. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb/base/common_queue.py +0 -0
  10. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb/base/decorators.py +0 -0
  11. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb/base/item.py +0 -0
  12. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb/base/log.py +0 -0
  13. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb/base/request.py +0 -0
  14. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb/base/response.py +0 -0
  15. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb/base/seed.py +0 -0
  16. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb/constant.py +0 -0
  17. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb/crawlers/__init__.py +0 -0
  18. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb/crawlers/file_crawler.py +0 -0
  19. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb/db/__init__.py +0 -0
  20. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb/db/redis_db.py +0 -0
  21. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb/exceptions/__init__.py +0 -0
  22. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb/exceptions/oss_db_exception.py +0 -0
  23. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb/launchers/__init__.py +0 -0
  24. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb/launchers/launcher.py +0 -0
  25. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb/launchers/launcher_pro.py +0 -0
  26. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb/pipelines/__init__.py +0 -0
  27. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb/pipelines/base_pipeline.py +0 -0
  28. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb/pipelines/loghub_pipeline.py +0 -0
  29. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb/setting.py +0 -0
  30. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb/utils/__init__.py +0 -0
  31. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb/utils/oss.py +0 -0
  32. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb/utils/tools.py +0 -0
  33. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb_launcher.egg-info/SOURCES.txt +0 -0
  34. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb_launcher.egg-info/dependency_links.txt +0 -0
  35. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb_launcher.egg-info/requires.txt +0 -0
  36. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/cobweb_launcher.egg-info/top_level.txt +0 -0
  37. {cobweb-launcher-1.1.14 → cobweb-launcher-1.1.16}/setup.cfg +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: cobweb-launcher
3
- Version: 1.1.14
3
+ Version: 1.1.16
4
4
  Summary: spider_hole
5
5
  Home-page: https://github.com/Juannie-PP/cobweb
6
6
  Author: Juannie-PP
@@ -69,30 +69,29 @@ class Crawler(threading.Thread):
69
69
  continue
70
70
 
71
71
  elif seed.params.retry >= self.max_retries:
72
- seed.params.identifier = DealModel.fail
72
+ seed.identifier = DealModel.fail
73
73
  self.launcher_queue['done'].push(seed)
74
74
  continue
75
75
 
76
76
  seed_detail_log_info = download_log_info(seed.to_dict)
77
77
 
78
- request_iterators = self.request(seed)
78
+ try:
79
+ request_iterators = self.request(seed)
79
80
 
80
- if not isgenerator(request_iterators):
81
- raise TypeError("request function isn't a generator!")
81
+ if not isgenerator(request_iterators):
82
+ raise TypeError("request function isn't a generator!")
82
83
 
83
- for request_item in request_iterators:
84
+ for request_item in request_iterators:
84
85
 
85
- if isinstance(request_item, BaseItem):
86
- self.upload_queue.push(request_item)
86
+ if isinstance(request_item, BaseItem):
87
+ self.upload_queue.push(request_item)
87
88
 
88
- elif isinstance(request_item, Request):
89
- try:
89
+ elif isinstance(request_item, Request):
90
90
  download_iterators = self.download(request_item)
91
91
  if not isgenerator(download_iterators):
92
92
  raise TypeError("download function isn't a generator")
93
93
  for download_item in download_iterators:
94
94
  if isinstance(download_item, Response):
95
- response_detail_log_info = download_log_info(download_item.to_dict)
96
95
  logger.info(LogTemplate.download_info.format(
97
96
  detail=seed_detail_log_info,
98
97
  retry=seed.params.retry,
@@ -100,7 +99,7 @@ class Crawler(threading.Thread):
100
99
  seed_version=seed.params.seed_version,
101
100
  identifier=seed.identifier or "",
102
101
  status=download_item.response,
103
- response=response_detail_log_info
102
+ response=download_log_info(download_item.to_dict)
104
103
  ))
105
104
  parse_iterators = self.parse(download_item)
106
105
  if not isgenerator(parse_iterators):
@@ -111,16 +110,16 @@ class Crawler(threading.Thread):
111
110
  self.distribute(parse_item, seed)
112
111
  else:
113
112
  self.distribute(download_item, seed)
114
- except Exception as e:
115
- logger.info(LogTemplate.download_exception.format(
116
- detail=seed_detail_log_info,
117
- retry=seed.params.retry,
118
- priority=seed.params.priority,
119
- seed_version=seed.params.seed_version,
120
- identifier=seed.identifier or "", exception=e
121
- ))
122
- seed.params.retry += 1
123
- self.launcher_queue['todo'].push(seed)
113
+ except Exception as e:
114
+ logger.info(LogTemplate.download_exception.format(
115
+ detail=seed_detail_log_info,
116
+ retry=seed.params.retry,
117
+ priority=seed.params.priority,
118
+ seed_version=seed.params.seed_version,
119
+ identifier=seed.identifier or "", exception=e
120
+ ))
121
+ seed.params.retry += 1
122
+ self.launcher_queue['todo'].push(seed)
124
123
 
125
124
  def run(self):
126
125
  for index in range(self.spider_thread_num):
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: cobweb-launcher
3
- Version: 1.1.14
3
+ Version: 1.1.16
4
4
  Summary: spider_hole
5
5
  Home-page: https://github.com/Juannie-PP/cobweb
6
6
  Author: Juannie-PP
@@ -5,7 +5,7 @@ with open("README.md", "r", encoding="utf-8") as fh:
5
5
 
6
6
  setup(
7
7
  name="cobweb-launcher",
8
- version="1.1.14",
8
+ version="1.1.16",
9
9
  packages=find_packages(),
10
10
  url="https://github.com/Juannie-PP/cobweb",
11
11
  license="MIT",