cobweb-launcher 1.2.5__tar.gz → 1.2.6__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of cobweb-launcher might be problematic. Click here for more details.

Files changed (38)
  1. {cobweb-launcher-1.2.5/cobweb_launcher.egg-info → cobweb-launcher-1.2.6}/PKG-INFO +1 -1
  2. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/crawlers/crawler.py +1 -1
  3. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/launchers/launcher.py +2 -2
  4. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/launchers/launcher_pro.py +7 -11
  5. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/setting.py +1 -1
  6. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6/cobweb_launcher.egg-info}/PKG-INFO +1 -1
  7. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/setup.py +1 -1
  8. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/LICENSE +0 -0
  9. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/README.md +0 -0
  10. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/__init__.py +0 -0
  11. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/base/__init__.py +0 -0
  12. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/base/common_queue.py +0 -0
  13. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/base/decorators.py +0 -0
  14. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/base/item.py +0 -0
  15. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/base/log.py +0 -0
  16. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/base/request.py +0 -0
  17. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/base/response.py +0 -0
  18. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/base/seed.py +0 -0
  19. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/constant.py +0 -0
  20. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/crawlers/__init__.py +0 -0
  21. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/db/__init__.py +0 -0
  22. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/db/redis_db.py +0 -0
  23. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/exceptions/__init__.py +0 -0
  24. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/exceptions/oss_db_exception.py +0 -0
  25. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/launchers/__init__.py +0 -0
  26. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/launchers/launcher_air.py +0 -0
  27. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/pipelines/__init__.py +0 -0
  28. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/pipelines/pipeline.py +0 -0
  29. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/pipelines/pipeline_console.py +0 -0
  30. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/pipelines/pipeline_loghub.py +0 -0
  31. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/utils/__init__.py +0 -0
  32. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/utils/oss.py +0 -0
  33. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb/utils/tools.py +0 -0
  34. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb_launcher.egg-info/SOURCES.txt +0 -0
  35. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb_launcher.egg-info/dependency_links.txt +0 -0
  36. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb_launcher.egg-info/requires.txt +0 -0
  37. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/cobweb_launcher.egg-info/top_level.txt +0 -0
  38. {cobweb-launcher-1.2.5 → cobweb-launcher-1.2.6}/setup.cfg +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: cobweb-launcher
3
- Version: 1.2.5
3
+ Version: 1.2.6
4
4
  Summary: spider_hole
5
5
  Home-page: https://github.com/Juannie-PP/cobweb
6
6
  Author: Juannie-PP
@@ -86,7 +86,7 @@ class Crawler(threading.Thread):
86
86
  time.sleep(1)
87
87
  continue
88
88
 
89
- elif seed.params.retry >= self.max_retries:
89
+ elif seed.params.retry > self.max_retries:
90
90
  seed.params.seed_status = DealModel.fail
91
91
  self._done.push(seed)
92
92
  continue
@@ -79,8 +79,8 @@ class Launcher(threading.Thread):
79
79
  self._done_queue_max_size = setting.DONE_QUEUE_MAX_SIZE
80
80
  self._upload_queue_max_size = setting.UPLOAD_QUEUE_MAX_SIZE
81
81
 
82
- self._spider_thread_num = setting.SPIDER_MAX_RETRIES
83
- self._spider_max_retries = setting.SPIDER_THREAD_NUM
82
+ self._spider_max_retries = setting.SPIDER_MAX_RETRIES
83
+ self._spider_thread_num = setting.SPIDER_THREAD_NUM
84
84
 
85
85
  self._done_model = setting.DONE_MODEL
86
86
  self._task_model = setting.TASK_MODEL
@@ -36,31 +36,27 @@ class LauncherPro(Launcher):
36
36
  def _execute_heartbeat(self):
37
37
  while not self._stop.is_set():
38
38
  if self._heartbeat_start_event.is_set():
39
- self._db.setex(self._heartbeat_key, 3)
40
- time.sleep(2)
39
+ self._db.setex(self._heartbeat_key, 5)
40
+ time.sleep(3)
41
41
 
42
42
  def _reset(self):
43
43
  """
44
44
  检查过期种子,重新添加到redis缓存中
45
45
  """
46
- init = True
47
46
  while not self._pause.is_set():
48
47
  reset_wait_seconds = 30
49
- start_reset_time = int(time.time())
50
48
  if self._db.lock(self._reset_lock_key, t=120):
51
- if not self.heartbeat:
52
- self._heartbeat_start_event.set()
53
49
 
54
50
  _min = -int(time.time()) + self._seed_reset_seconds \
55
- if self.heartbeat or not init else "-inf"
51
+ if self.heartbeat else "-inf"
56
52
 
57
53
  self._db.members(self._todo_key, 0, _min=_min, _max="(0")
58
54
  self._db.delete(self._reset_lock_key)
59
55
 
60
- ttl = 120 - int(time.time()) + start_reset_time
61
- reset_wait_seconds = max(ttl, 1)
56
+ if not self.heartbeat:
57
+ self._heartbeat_start_event.set()
58
+
62
59
  time.sleep(reset_wait_seconds)
63
- init = False
64
60
 
65
61
  def _scheduler(self):
66
62
  """
@@ -111,7 +107,7 @@ class LauncherPro(Launcher):
111
107
  refresh_time = int(time.time())
112
108
  seeds = {k:-refresh_time - v / 1000 for k, v in self.__DOING__.items()}
113
109
  self._db.zadd(self._todo_key, item=seeds, xx=True)
114
- time.sleep(30)
110
+ time.sleep(15)
115
111
 
116
112
  def _delete(self):
117
113
  """
@@ -45,7 +45,7 @@ TODO_QUEUE_FULL_WAIT_SECONDS = 5 # todo队列已满时等待时间
45
45
  NEW_QUEUE_WAIT_SECONDS = 30 # new队列等待时间
46
46
  DONE_QUEUE_WAIT_SECONDS = 15 # done队列等待时间
47
47
  UPLOAD_QUEUE_WAIT_SECONDS = 15 # upload队列等待时间
48
- SEED_RESET_SECONDS = 300 # 种子重制时间
48
+ SEED_RESET_SECONDS = 30 # 种子重制时间
49
49
 
50
50
 
51
51
  # Launcher 队列长度
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: cobweb-launcher
3
- Version: 1.2.5
3
+ Version: 1.2.6
4
4
  Summary: spider_hole
5
5
  Home-page: https://github.com/Juannie-PP/cobweb
6
6
  Author: Juannie-PP
@@ -5,7 +5,7 @@ with open("README.md", "r", encoding="utf-8") as fh:
5
5
 
6
6
  setup(
7
7
  name="cobweb-launcher",
8
- version="1.2.5",
8
+ version="1.2.6",
9
9
  packages=find_packages(),
10
10
  url="https://github.com/Juannie-PP/cobweb",
11
11
  license="MIT",
File without changes