parsehub 2.0.26__tar.gz → 2.0.28__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {parsehub-2.0.26/src/parsehub.egg-info → parsehub-2.0.28}/PKG-INFO +1 -1
- {parsehub-2.0.26 → parsehub-2.0.28}/pyproject.toml +1 -1
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/parsers/parser/douyin.py +9 -2
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/provider_api/twitter.py +1 -11
- {parsehub-2.0.26 → parsehub-2.0.28/src/parsehub.egg-info}/PKG-INFO +1 -1
- {parsehub-2.0.26 → parsehub-2.0.28}/LICENSE +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/README.md +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/setup.cfg +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/__init__.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/__init__.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/cli.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/cli_config.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/config/__init__.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/config/config.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/errors.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/parsers/__init__.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/parsers/base/__init__.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/parsers/base/base.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/parsers/base/ytdlp.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/parsers/parser/__init__.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/parsers/parser/bilibili.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/parsers/parser/coolapk.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/parsers/parser/facebook.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/parsers/parser/instagram.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/parsers/parser/kuaishou.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/parsers/parser/pipix.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/parsers/parser/threads.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/parsers/parser/tieba.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/parsers/parser/tiktok.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/parsers/parser/twitter.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/parsers/parser/weibo.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/parsers/parser/weixin.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/parsers/parser/xhs.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/parsers/parser/xiaoheihe.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/parsers/parser/youtube.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/parsers/parser/zuiyou.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/provider_api/__init__.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/provider_api/bilibili.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/provider_api/coolapk.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/provider_api/douyin.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/provider_api/instagram.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/provider_api/kuaishou.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/provider_api/pipix.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/provider_api/threads.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/provider_api/tieba.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/provider_api/tiktok.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/provider_api/weibo.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/provider_api/weixin.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/provider_api/xhs.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/provider_api/xiaoheihe.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/provider_api/zuiyou.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/types/__init__.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/types/callback.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/types/media_file.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/types/media_ref.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/types/platform.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/types/post.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/types/result.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/utils/downloader.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/utils/media_info.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub/utils/utils.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub.egg-info/SOURCES.txt +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub.egg-info/dependency_links.txt +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub.egg-info/entry_points.txt +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub.egg-info/requires.txt +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/src/parsehub.egg-info/top_level.txt +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/test/test_cli.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/test/test_cli_config.py +0 -0
- {parsehub-2.0.26 → parsehub-2.0.28}/test/test_core_offline.py +0 -0
|
@@ -12,6 +12,7 @@ from ...types import (
|
|
|
12
12
|
LivePhotoRef,
|
|
13
13
|
MultimediaParseResult,
|
|
14
14
|
ParseError,
|
|
15
|
+
ParseResult,
|
|
15
16
|
Platform,
|
|
16
17
|
VideoParseResult,
|
|
17
18
|
VideoRef,
|
|
@@ -57,13 +58,13 @@ class DouyinParser(BaseParser):
|
|
|
57
58
|
@staticmethod
|
|
58
59
|
def _build_image_result(result: "DouyinApiResult") -> ImageParseResult:
|
|
59
60
|
"""构建图片解析结果"""
|
|
60
|
-
return
|
|
61
|
+
return DouyinImageParseResult(
|
|
61
62
|
title=result.desc,
|
|
62
63
|
photo=result.image_list,
|
|
63
64
|
)
|
|
64
65
|
|
|
65
66
|
|
|
66
|
-
class
|
|
67
|
+
class DouyinParseResult(ParseResult):
|
|
67
68
|
async def _do_download(
|
|
68
69
|
self,
|
|
69
70
|
*,
|
|
@@ -87,6 +88,12 @@ class DouyinVideoParseResult(VideoParseResult):
|
|
|
87
88
|
)
|
|
88
89
|
|
|
89
90
|
|
|
91
|
+
class DouyinVideoParseResult(DouyinParseResult, VideoParseResult): ...
|
|
92
|
+
|
|
93
|
+
|
|
94
|
+
class DouyinImageParseResult(DouyinParseResult, ImageParseResult): ...
|
|
95
|
+
|
|
96
|
+
|
|
90
97
|
def remove_video_watermark(url: str) -> str:
|
|
91
98
|
"""移除抖音视频水印标识 (playwm -> play)"""
|
|
92
99
|
return url.replace("playwm", "play")
|
|
@@ -29,14 +29,13 @@ class Twitter:
|
|
|
29
29
|
"authorization": self.authorization,
|
|
30
30
|
"content-type": "application/json",
|
|
31
31
|
"user-agent": GlobalConfig.ua,
|
|
32
|
-
"x-guest-token": await self.get_guest_token(url),
|
|
33
32
|
"x-twitter-active-user": "yes",
|
|
34
33
|
"x-twitter-client-language": "zh-cn",
|
|
35
34
|
}
|
|
36
35
|
|
|
37
36
|
cookie = None
|
|
38
37
|
if self.cookie and self.check_cookie():
|
|
39
|
-
headers["x-csrf-token"] = self.cookie.get("ct0")
|
|
38
|
+
headers["x-csrf-token"] = self.cookie.get("ct0", "")
|
|
40
39
|
cookie = self.cookie
|
|
41
40
|
|
|
42
41
|
params = {
|
|
@@ -158,15 +157,6 @@ class Twitter:
|
|
|
158
157
|
raise ValueError(f"Invalid tweet url: {url}")
|
|
159
158
|
return match[1]
|
|
160
159
|
|
|
161
|
-
async def get_guest_token(self, url: str):
|
|
162
|
-
async with httpx.AsyncClient(proxy=self.proxy) as client:
|
|
163
|
-
response = await client.post(url)
|
|
164
|
-
response.raise_for_status()
|
|
165
|
-
guest_token = re.search(r'cookie="gt=(\d+);', response.text)
|
|
166
|
-
if not guest_token:
|
|
167
|
-
raise Exception("error -5: 获取 guest_token 失败")
|
|
168
|
-
return guest_token[1]
|
|
169
|
-
|
|
170
160
|
def check_cookie(self) -> bool:
|
|
171
161
|
if not self.cookie:
|
|
172
162
|
return False
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|