cobweb-launcher 1.1.9__tar.gz → 1.1.10__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of cobweb-launcher might be problematic. Click here for more details.

Files changed (37)
  1. {cobweb-launcher-1.1.9/cobweb_launcher.egg-info → cobweb-launcher-1.1.10}/PKG-INFO +1 -1
  2. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb/__init__.py +1 -1
  3. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb/constant.py +1 -1
  4. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb/crawlers/file_crawler.py +3 -3
  5. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb/launchers/launcher.py +1 -1
  6. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb/setting.py +1 -0
  7. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb/utils/oss.py +3 -0
  8. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10/cobweb_launcher.egg-info}/PKG-INFO +1 -1
  9. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/setup.py +1 -1
  10. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/LICENSE +0 -0
  11. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/README.md +0 -0
  12. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb/base/__init__.py +0 -0
  13. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb/base/common_queue.py +0 -0
  14. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb/base/decorators.py +0 -0
  15. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb/base/item.py +0 -0
  16. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb/base/log.py +0 -0
  17. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb/base/request.py +0 -0
  18. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb/base/response.py +0 -0
  19. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb/base/seed.py +0 -0
  20. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb/crawlers/__init__.py +0 -0
  21. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb/crawlers/base_crawler.py +0 -0
  22. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb/db/__init__.py +0 -0
  23. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb/db/redis_db.py +0 -0
  24. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb/exceptions/__init__.py +0 -0
  25. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb/exceptions/oss_db_exception.py +0 -0
  26. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb/launchers/__init__.py +0 -0
  27. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb/launchers/launcher_pro.py +0 -0
  28. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb/pipelines/__init__.py +0 -0
  29. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb/pipelines/base_pipeline.py +0 -0
  30. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb/pipelines/loghub_pipeline.py +0 -0
  31. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb/utils/__init__.py +0 -0
  32. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb/utils/tools.py +0 -0
  33. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb_launcher.egg-info/SOURCES.txt +0 -0
  34. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb_launcher.egg-info/dependency_links.txt +0 -0
  35. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb_launcher.egg-info/requires.txt +0 -0
  36. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/cobweb_launcher.egg-info/top_level.txt +0 -0
  37. {cobweb-launcher-1.1.9 → cobweb-launcher-1.1.10}/setup.cfg +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: cobweb-launcher
3
- Version: 1.1.9
3
+ Version: 1.1.10
4
4
  Summary: spider_hole
5
5
  Home-page: https://github.com/Juannie-PP/cobweb
6
6
  Author: Juannie-PP
@@ -1,2 +1,2 @@
1
1
  from .launchers import Launcher, LauncherPro
2
- from .constant import Crawler
2
+ from .constant import CrawlerModel
@@ -1,5 +1,5 @@
1
1
 
2
- class Crawler:
2
+ class CrawlerModel:
3
3
 
4
4
  default = "cobweb.crawlers.Crawler"
5
5
  file_air = "cobweb.crawlers.FileCrawlerAir"
@@ -17,7 +17,7 @@ class FileCrawlerAir(Crawler):
17
17
  seed_dict = item.seed.to_dict
18
18
  bucket_name = oss_util.bucket
19
19
  try:
20
- key = item.seed.oss_path
20
+ key = item.seed.oss_path or getattr(item, "oss_path", None)
21
21
  if oss_util.exists(key):
22
22
  content_length = oss_util.head(key).content_length
23
23
  yield Response(item.seed, "exists", bucket_name=bucket_name, data_size=content_length, **seed_dict)
@@ -90,14 +90,14 @@ class FileCrawlerAir(Crawler):
90
90
  yield Seed(seed_dict, identifier="merge")
91
91
 
92
92
 
93
- class FileCrawlerPro(Crawler):
93
+ class VideoCrawler(FileCrawlerAir):
94
94
 
95
95
  @staticmethod
96
96
  def download(item: Request) -> Union[Seed, BaseItem, Response, str]:
97
97
  seed_dict = item.seed.to_dict
98
98
  bucket_name = oss_util.bucket
99
99
  try:
100
- key = item.seed.oss_path
100
+ key = item.seed.oss_path or getattr(item, "oss_path", None)
101
101
  if oss_util.exists(key):
102
102
  content_length = oss_util.head(key).content_length
103
103
  yield Response(item.seed, "exists", bucket_name=bucket_name, data_size=content_length, **seed_dict)
@@ -59,7 +59,7 @@ class Launcher(threading.Thread):
59
59
  _setting.update(**kwargs)
60
60
 
61
61
  for k, v in _setting.items():
62
- setattr(setting, k, v)
62
+ setattr(setting, k.upper(), v)
63
63
 
64
64
  self._Crawler = dynamic_load_class(setting.CRAWLER)
65
65
  self._Pipeline = dynamic_load_class(setting.PIPELINE)
@@ -26,6 +26,7 @@ OSS_SECRET_KEY = os.getenv("OSS_SECRET_KEY")
26
26
  OSS_CHUNK_SIZE = 10 * 1024 ** 2
27
27
  OSS_MIN_UPLOAD_SIZE = 1024
28
28
 
29
+
29
30
  # 采集器选择
30
31
  CRAWLER = "cobweb.crawlers.Crawler"
31
32
 
@@ -15,11 +15,13 @@ class OssUtil:
15
15
  secret_key=None,
16
16
  chunk_size=None,
17
17
  min_upload_size=None,
18
+ **kwargs
18
19
  ):
19
20
  self.bucket = bucket or setting.OSS_BUCKET
20
21
  self.endpoint = endpoint or setting.OSS_ENDPOINT
21
22
  self.chunk_size = int(chunk_size or setting.OSS_CHUNK_SIZE)
22
23
  self.min_upload_size = int(min_upload_size or setting.OSS_MIN_UPLOAD_SIZE)
24
+
23
25
  self._auth = Auth(
24
26
  access_key_id=access_key or setting.OSS_ACCESS_KEY,
25
27
  access_key_secret=secret_key or setting.OSS_SECRET_KEY
@@ -28,6 +30,7 @@ class OssUtil:
28
30
  auth=self._auth,
29
31
  endpoint=self.endpoint,
30
32
  bucket_name=self.bucket,
33
+ **kwargs
31
34
  )
32
35
 
33
36
  def exists(self, key: str) -> bool:
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: cobweb-launcher
3
- Version: 1.1.9
3
+ Version: 1.1.10
4
4
  Summary: spider_hole
5
5
  Home-page: https://github.com/Juannie-PP/cobweb
6
6
  Author: Juannie-PP
@@ -5,7 +5,7 @@ with open("README.md", "r", encoding="utf-8") as fh:
5
5
 
6
6
  setup(
7
7
  name="cobweb-launcher",
8
- version="1.1.9",
8
+ version="1.1.10",
9
9
  packages=find_packages(),
10
10
  url="https://github.com/Juannie-PP/cobweb",
11
11
  license="MIT",