cobweb-launcher 1.2.61__tar.gz → 1.2.62__tar.gz
This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the differences between those versions as they appear in their respective public registries.
- {cobweb-launcher-1.2.61/cobweb_launcher.egg-info → cobweb-launcher-1.2.62}/PKG-INFO +1 -1
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/crawlers/crawler.py +1 -1
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/launchers/launcher.py +2 -2
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/launchers/launcher_air.py +11 -6
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/launchers/launcher_api.py +12 -6
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/launchers/launcher_pro.py +12 -6
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62/cobweb_launcher.egg-info}/PKG-INFO +1 -1
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/setup.py +1 -1
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/LICENSE +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/README.md +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/__init__.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/base/__init__.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/base/common_queue.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/base/decorators.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/base/item.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/base/log.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/base/request.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/base/response.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/base/seed.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/constant.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/crawlers/__init__.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/crawlers/base_crawler.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/crawlers/file_crawler.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/db/__init__.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/db/api_db.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/db/redis_db.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/db/redis_db_new.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/exceptions/__init__.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/exceptions/oss_db_exception.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/launchers/__init__.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/pipelines/__init__.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/pipelines/pipeline.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/pipelines/pipeline_console.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/pipelines/pipeline_loghub.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/setting.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/utils/__init__.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/utils/bloom.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/utils/dotting.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/utils/oss.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb/utils/tools.py +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb_launcher.egg-info/SOURCES.txt +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb_launcher.egg-info/dependency_links.txt +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb_launcher.egg-info/requires.txt +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb_launcher.egg-info/top_level.txt +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/setup.cfg +0 -0
- {cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/test/test.py +0 -0
@@ -83,7 +83,7 @@ class Crawler(threading.Thread):
|
|
83
83
|
if isinstance(item, BaseItem):
|
84
84
|
self._upload_data(item)
|
85
85
|
elif isinstance(item, Seed):
|
86
|
-
self._add_seed(item)
|
86
|
+
self._add_seed((seed, item))
|
87
87
|
elif isinstance(item, str) and item == DealModel.poll:
|
88
88
|
self._set_seed(seed)
|
89
89
|
elif isinstance(item, str) and item == DealModel.done:
|
@@ -173,8 +173,8 @@ class Launcher(threading.Thread):
|
|
173
173
|
def _upload_data(self, data, **kwargs):
|
174
174
|
self.__LAUNCHER_QUEUE__["upload"].push(data, **kwargs)
|
175
175
|
|
176
|
-
def _add_seed(self,
|
177
|
-
self.__LAUNCHER_QUEUE__["new"].push(
|
176
|
+
def _add_seed(self, seeds, **kwargs):
|
177
|
+
self.__LAUNCHER_QUEUE__["new"].push(seeds, direct_insertion=True, **kwargs)
|
178
178
|
|
179
179
|
def _delete_seed(self, seed, **kwargs):
|
180
180
|
self.__LAUNCHER_QUEUE__["done"].push(seed, **kwargs)
|
@@ -13,15 +13,20 @@ class LauncherAir(Launcher):
|
|
13
13
|
|
14
14
|
@check_pause
|
15
15
|
def _insert(self):
|
16
|
-
|
16
|
+
new_seeds = {}
|
17
|
+
del_seeds = set()
|
17
18
|
status = self.__LAUNCHER_QUEUE__['new'].length < self._new_queue_max_size
|
18
19
|
for _ in range(self._new_queue_max_size):
|
19
|
-
|
20
|
-
if not
|
20
|
+
seed_tuple = self.__LAUNCHER_QUEUE__['new'].pop()
|
21
|
+
if not seed_tuple:
|
21
22
|
break
|
22
|
-
|
23
|
-
|
24
|
-
|
23
|
+
seed, new_seed = seed_tuple
|
24
|
+
new_seeds[new_seed.to_string] = new_seed.params.priority
|
25
|
+
del_seeds.add(seed.to_string)
|
26
|
+
if new_seeds:
|
27
|
+
self.__LAUNCHER_QUEUE__['todo'].push(new_seeds)
|
28
|
+
if del_seeds:
|
29
|
+
self.__LAUNCHER_QUEUE__['done'].push(del_seeds)
|
25
30
|
if status:
|
26
31
|
time.sleep(self._new_queue_wait_seconds)
|
27
32
|
|
@@ -106,14 +106,20 @@ class LauncherApi(Launcher):
|
|
106
106
|
"""
|
107
107
|
添加新种子到redis队列中
|
108
108
|
"""
|
109
|
-
|
109
|
+
new_seeds = {}
|
110
|
+
del_seeds = set()
|
110
111
|
status = self.__LAUNCHER_QUEUE__['new'].length < self._new_queue_max_size
|
111
112
|
for _ in range(self._new_queue_max_size):
|
112
|
-
|
113
|
-
if
|
114
|
-
|
115
|
-
|
116
|
-
|
113
|
+
seed_tuple = self.__LAUNCHER_QUEUE__['new'].pop()
|
114
|
+
if not seed_tuple:
|
115
|
+
break
|
116
|
+
seed, new_seed = seed_tuple
|
117
|
+
new_seeds[new_seed.to_string] = new_seed.params.priority
|
118
|
+
del_seeds.add(seed.to_string)
|
119
|
+
if new_seeds:
|
120
|
+
self._db.zadd(self._todo_key, new_seeds, nx=True)
|
121
|
+
if del_seeds:
|
122
|
+
self.__LAUNCHER_QUEUE__['done'].push(del_seeds)
|
117
123
|
if status:
|
118
124
|
time.sleep(self._new_queue_wait_seconds)
|
119
125
|
|
@@ -108,14 +108,20 @@ class LauncherPro(Launcher):
|
|
108
108
|
"""
|
109
109
|
添加新种子到redis队列中
|
110
110
|
"""
|
111
|
-
|
111
|
+
new_seeds = {}
|
112
|
+
del_seeds = set()
|
112
113
|
status = self.__LAUNCHER_QUEUE__['new'].length < self._new_queue_max_size
|
113
114
|
for _ in range(self._new_queue_max_size):
|
114
|
-
|
115
|
-
if
|
116
|
-
|
117
|
-
|
118
|
-
|
115
|
+
seed_tuple = self.__LAUNCHER_QUEUE__['new'].pop()
|
116
|
+
if not seed_tuple:
|
117
|
+
break
|
118
|
+
seed, new_seed = seed_tuple
|
119
|
+
new_seeds[new_seed.to_string] = new_seed.params.priority
|
120
|
+
del_seeds.add(seed.to_string)
|
121
|
+
if new_seeds:
|
122
|
+
self._db.zadd(self._todo_key, new_seeds, nx=True)
|
123
|
+
if del_seeds:
|
124
|
+
self.__LAUNCHER_QUEUE__['done'].push(del_seeds)
|
119
125
|
if status:
|
120
126
|
time.sleep(self._new_queue_wait_seconds)
|
121
127
|
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{cobweb-launcher-1.2.61 → cobweb-launcher-1.2.62}/cobweb_launcher.egg-info/dependency_links.txt
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|