webscout 8.3.7__py3-none-any.whl → 2025.10.11__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of webscout might be problematic. Click here for more details.
- webscout/AIauto.py +250 -250
- webscout/AIbase.py +379 -379
- webscout/AIutel.py +60 -60
- webscout/Bard.py +1012 -1012
- webscout/Bing_search.py +417 -417
- webscout/DWEBS.py +529 -529
- webscout/Extra/Act.md +309 -309
- webscout/Extra/GitToolkit/__init__.py +10 -10
- webscout/Extra/GitToolkit/gitapi/README.md +110 -110
- webscout/Extra/GitToolkit/gitapi/__init__.py +11 -11
- webscout/Extra/GitToolkit/gitapi/repository.py +195 -195
- webscout/Extra/GitToolkit/gitapi/user.py +96 -96
- webscout/Extra/GitToolkit/gitapi/utils.py +61 -61
- webscout/Extra/YTToolkit/README.md +375 -375
- webscout/Extra/YTToolkit/YTdownloader.py +956 -956
- webscout/Extra/YTToolkit/__init__.py +2 -2
- webscout/Extra/YTToolkit/transcriber.py +475 -475
- webscout/Extra/YTToolkit/ytapi/README.md +44 -44
- webscout/Extra/YTToolkit/ytapi/__init__.py +6 -6
- webscout/Extra/YTToolkit/ytapi/channel.py +307 -307
- webscout/Extra/YTToolkit/ytapi/errors.py +13 -13
- webscout/Extra/YTToolkit/ytapi/extras.py +118 -118
- webscout/Extra/YTToolkit/ytapi/https.py +88 -88
- webscout/Extra/YTToolkit/ytapi/patterns.py +61 -61
- webscout/Extra/YTToolkit/ytapi/playlist.py +58 -58
- webscout/Extra/YTToolkit/ytapi/pool.py +7 -7
- webscout/Extra/YTToolkit/ytapi/query.py +39 -39
- webscout/Extra/YTToolkit/ytapi/stream.py +62 -62
- webscout/Extra/YTToolkit/ytapi/utils.py +62 -62
- webscout/Extra/YTToolkit/ytapi/video.py +232 -232
- webscout/Extra/autocoder/__init__.py +9 -9
- webscout/Extra/autocoder/autocoder.py +1105 -1105
- webscout/Extra/autocoder/autocoder_utiles.py +332 -332
- webscout/Extra/gguf.md +429 -429
- webscout/Extra/gguf.py +1213 -1213
- webscout/Extra/tempmail/README.md +487 -487
- webscout/Extra/tempmail/__init__.py +27 -27
- webscout/Extra/tempmail/async_utils.py +140 -140
- webscout/Extra/tempmail/base.py +160 -160
- webscout/Extra/tempmail/cli.py +186 -186
- webscout/Extra/tempmail/emailnator.py +84 -84
- webscout/Extra/tempmail/mail_tm.py +360 -360
- webscout/Extra/tempmail/temp_mail_io.py +291 -291
- webscout/Extra/weather.md +281 -281
- webscout/Extra/weather.py +193 -193
- webscout/Litlogger/README.md +10 -10
- webscout/Litlogger/__init__.py +15 -15
- webscout/Litlogger/formats.py +13 -13
- webscout/Litlogger/handlers.py +121 -121
- webscout/Litlogger/levels.py +13 -13
- webscout/Litlogger/logger.py +134 -134
- webscout/Provider/AISEARCH/Perplexity.py +332 -332
- webscout/Provider/AISEARCH/README.md +279 -279
- webscout/Provider/AISEARCH/__init__.py +16 -1
- webscout/Provider/AISEARCH/felo_search.py +206 -206
- webscout/Provider/AISEARCH/genspark_search.py +323 -323
- webscout/Provider/AISEARCH/hika_search.py +185 -185
- webscout/Provider/AISEARCH/iask_search.py +410 -410
- webscout/Provider/AISEARCH/monica_search.py +219 -219
- webscout/Provider/AISEARCH/scira_search.py +316 -316
- webscout/Provider/AISEARCH/stellar_search.py +177 -177
- webscout/Provider/AISEARCH/webpilotai_search.py +255 -255
- webscout/Provider/Aitopia.py +314 -314
- webscout/Provider/Apriel.py +306 -0
- webscout/Provider/ChatGPTClone.py +236 -236
- webscout/Provider/ChatSandbox.py +343 -343
- webscout/Provider/Cloudflare.py +324 -324
- webscout/Provider/Cohere.py +208 -208
- webscout/Provider/Deepinfra.py +370 -366
- webscout/Provider/ExaAI.py +260 -260
- webscout/Provider/ExaChat.py +308 -308
- webscout/Provider/Flowith.py +221 -221
- webscout/Provider/GMI.py +293 -0
- webscout/Provider/Gemini.py +164 -164
- webscout/Provider/GeminiProxy.py +167 -167
- webscout/Provider/GithubChat.py +371 -372
- webscout/Provider/Groq.py +800 -800
- webscout/Provider/HeckAI.py +383 -383
- webscout/Provider/Jadve.py +282 -282
- webscout/Provider/K2Think.py +307 -307
- webscout/Provider/Koboldai.py +205 -205
- webscout/Provider/LambdaChat.py +423 -423
- webscout/Provider/Nemotron.py +244 -244
- webscout/Provider/Netwrck.py +248 -248
- webscout/Provider/OLLAMA.py +395 -395
- webscout/Provider/OPENAI/Cloudflare.py +393 -393
- webscout/Provider/OPENAI/FalconH1.py +451 -451
- webscout/Provider/OPENAI/FreeGemini.py +296 -296
- webscout/Provider/OPENAI/K2Think.py +431 -431
- webscout/Provider/OPENAI/NEMOTRON.py +240 -240
- webscout/Provider/OPENAI/PI.py +427 -427
- webscout/Provider/OPENAI/README.md +959 -959
- webscout/Provider/OPENAI/TogetherAI.py +345 -345
- webscout/Provider/OPENAI/TwoAI.py +465 -465
- webscout/Provider/OPENAI/__init__.py +33 -18
- webscout/Provider/OPENAI/base.py +248 -248
- webscout/Provider/OPENAI/chatglm.py +528 -0
- webscout/Provider/OPENAI/chatgpt.py +592 -592
- webscout/Provider/OPENAI/chatgptclone.py +521 -521
- webscout/Provider/OPENAI/chatsandbox.py +202 -202
- webscout/Provider/OPENAI/deepinfra.py +318 -314
- webscout/Provider/OPENAI/e2b.py +1665 -1665
- webscout/Provider/OPENAI/exaai.py +420 -420
- webscout/Provider/OPENAI/exachat.py +452 -452
- webscout/Provider/OPENAI/friendli.py +232 -232
- webscout/Provider/OPENAI/{refact.py → gmi.py} +324 -274
- webscout/Provider/OPENAI/groq.py +364 -364
- webscout/Provider/OPENAI/heckai.py +314 -314
- webscout/Provider/OPENAI/llmchatco.py +337 -337
- webscout/Provider/OPENAI/netwrck.py +355 -355
- webscout/Provider/OPENAI/oivscode.py +290 -290
- webscout/Provider/OPENAI/opkfc.py +518 -518
- webscout/Provider/OPENAI/pydantic_imports.py +1 -1
- webscout/Provider/OPENAI/scirachat.py +535 -535
- webscout/Provider/OPENAI/sonus.py +308 -308
- webscout/Provider/OPENAI/standardinput.py +442 -442
- webscout/Provider/OPENAI/textpollinations.py +340 -340
- webscout/Provider/OPENAI/toolbaz.py +419 -416
- webscout/Provider/OPENAI/typefully.py +362 -362
- webscout/Provider/OPENAI/utils.py +295 -295
- webscout/Provider/OPENAI/venice.py +436 -436
- webscout/Provider/OPENAI/wisecat.py +387 -387
- webscout/Provider/OPENAI/writecream.py +166 -166
- webscout/Provider/OPENAI/x0gpt.py +378 -378
- webscout/Provider/OPENAI/yep.py +389 -389
- webscout/Provider/OpenGPT.py +230 -230
- webscout/Provider/Openai.py +243 -243
- webscout/Provider/PI.py +405 -405
- webscout/Provider/Perplexitylabs.py +430 -430
- webscout/Provider/QwenLM.py +272 -272
- webscout/Provider/STT/__init__.py +16 -1
- webscout/Provider/Sambanova.py +257 -257
- webscout/Provider/StandardInput.py +309 -309
- webscout/Provider/TTI/README.md +82 -82
- webscout/Provider/TTI/__init__.py +33 -18
- webscout/Provider/TTI/aiarta.py +413 -413
- webscout/Provider/TTI/base.py +136 -136
- webscout/Provider/TTI/bing.py +243 -243
- webscout/Provider/TTI/gpt1image.py +149 -149
- webscout/Provider/TTI/imagen.py +196 -196
- webscout/Provider/TTI/infip.py +211 -211
- webscout/Provider/TTI/magicstudio.py +232 -232
- webscout/Provider/TTI/monochat.py +219 -219
- webscout/Provider/TTI/piclumen.py +214 -214
- webscout/Provider/TTI/pixelmuse.py +232 -232
- webscout/Provider/TTI/pollinations.py +232 -232
- webscout/Provider/TTI/together.py +288 -288
- webscout/Provider/TTI/utils.py +12 -12
- webscout/Provider/TTI/venice.py +367 -367
- webscout/Provider/TTS/README.md +192 -192
- webscout/Provider/TTS/__init__.py +33 -18
- webscout/Provider/TTS/parler.py +110 -110
- webscout/Provider/TTS/streamElements.py +333 -333
- webscout/Provider/TTS/utils.py +280 -280
- webscout/Provider/TeachAnything.py +237 -237
- webscout/Provider/TextPollinationsAI.py +310 -310
- webscout/Provider/TogetherAI.py +356 -356
- webscout/Provider/TwoAI.py +312 -312
- webscout/Provider/TypliAI.py +311 -311
- webscout/Provider/UNFINISHED/ChatHub.py +208 -208
- webscout/Provider/UNFINISHED/ChutesAI.py +313 -313
- webscout/Provider/UNFINISHED/GizAI.py +294 -294
- webscout/Provider/UNFINISHED/Marcus.py +198 -198
- webscout/Provider/UNFINISHED/Qodo.py +477 -477
- webscout/Provider/UNFINISHED/VercelAIGateway.py +338 -338
- webscout/Provider/UNFINISHED/XenAI.py +324 -324
- webscout/Provider/UNFINISHED/Youchat.py +330 -330
- webscout/Provider/UNFINISHED/liner.py +334 -0
- webscout/Provider/UNFINISHED/liner_api_request.py +262 -262
- webscout/Provider/UNFINISHED/puterjs.py +634 -634
- webscout/Provider/UNFINISHED/samurai.py +223 -223
- webscout/Provider/UNFINISHED/test_lmarena.py +119 -119
- webscout/Provider/Venice.py +250 -250
- webscout/Provider/VercelAI.py +256 -256
- webscout/Provider/WiseCat.py +231 -231
- webscout/Provider/WrDoChat.py +366 -366
- webscout/Provider/__init__.py +33 -18
- webscout/Provider/ai4chat.py +174 -174
- webscout/Provider/akashgpt.py +331 -331
- webscout/Provider/cerebras.py +446 -446
- webscout/Provider/chatglm.py +394 -301
- webscout/Provider/cleeai.py +211 -211
- webscout/Provider/elmo.py +282 -282
- webscout/Provider/geminiapi.py +208 -208
- webscout/Provider/granite.py +261 -261
- webscout/Provider/hermes.py +263 -263
- webscout/Provider/julius.py +223 -223
- webscout/Provider/learnfastai.py +309 -309
- webscout/Provider/llama3mitril.py +214 -214
- webscout/Provider/llmchat.py +243 -243
- webscout/Provider/llmchatco.py +290 -290
- webscout/Provider/meta.py +801 -801
- webscout/Provider/oivscode.py +309 -309
- webscout/Provider/scira_chat.py +383 -383
- webscout/Provider/searchchat.py +292 -292
- webscout/Provider/sonus.py +258 -258
- webscout/Provider/toolbaz.py +370 -367
- webscout/Provider/turboseek.py +273 -273
- webscout/Provider/typefully.py +207 -207
- webscout/Provider/yep.py +372 -372
- webscout/__init__.py +30 -31
- webscout/__main__.py +5 -5
- webscout/auth/api_key_manager.py +189 -189
- webscout/auth/config.py +175 -175
- webscout/auth/models.py +185 -185
- webscout/auth/routes.py +664 -664
- webscout/auth/simple_logger.py +236 -236
- webscout/cli.py +523 -523
- webscout/conversation.py +438 -438
- webscout/exceptions.py +361 -361
- webscout/litagent/Readme.md +298 -298
- webscout/litagent/__init__.py +28 -28
- webscout/litagent/agent.py +581 -581
- webscout/litagent/constants.py +59 -59
- webscout/litprinter/__init__.py +58 -58
- webscout/models.py +181 -181
- webscout/optimizers.py +419 -419
- webscout/prompt_manager.py +288 -288
- webscout/sanitize.py +1078 -1078
- webscout/scout/README.md +401 -401
- webscout/scout/__init__.py +8 -8
- webscout/scout/core/__init__.py +6 -6
- webscout/scout/core/crawler.py +297 -297
- webscout/scout/core/scout.py +706 -706
- webscout/scout/core/search_result.py +95 -95
- webscout/scout/core/text_analyzer.py +62 -62
- webscout/scout/core/text_utils.py +277 -277
- webscout/scout/core/web_analyzer.py +51 -51
- webscout/scout/element.py +599 -599
- webscout/scout/parsers/__init__.py +69 -69
- webscout/scout/parsers/html5lib_parser.py +172 -172
- webscout/scout/parsers/html_parser.py +236 -236
- webscout/scout/parsers/lxml_parser.py +178 -178
- webscout/scout/utils.py +37 -37
- webscout/swiftcli/Readme.md +323 -323
- webscout/swiftcli/__init__.py +95 -95
- webscout/swiftcli/core/__init__.py +7 -7
- webscout/swiftcli/core/cli.py +308 -308
- webscout/swiftcli/core/context.py +104 -104
- webscout/swiftcli/core/group.py +241 -241
- webscout/swiftcli/decorators/__init__.py +28 -28
- webscout/swiftcli/decorators/command.py +221 -221
- webscout/swiftcli/decorators/options.py +220 -220
- webscout/swiftcli/decorators/output.py +302 -302
- webscout/swiftcli/exceptions.py +21 -21
- webscout/swiftcli/plugins/__init__.py +9 -9
- webscout/swiftcli/plugins/base.py +135 -135
- webscout/swiftcli/plugins/manager.py +269 -269
- webscout/swiftcli/utils/__init__.py +59 -59
- webscout/swiftcli/utils/formatting.py +252 -252
- webscout/swiftcli/utils/parsing.py +267 -267
- webscout/update_checker.py +117 -117
- webscout/version.py +1 -1
- webscout/webscout_search.py +1183 -1183
- webscout/webscout_search_async.py +649 -649
- webscout/yep_search.py +346 -346
- webscout/zeroart/README.md +89 -89
- webscout/zeroart/__init__.py +134 -134
- webscout/zeroart/base.py +66 -66
- webscout/zeroart/effects.py +100 -100
- webscout/zeroart/fonts.py +1238 -1238
- {webscout-8.3.7.dist-info → webscout-2025.10.11.dist-info}/METADATA +937 -937
- webscout-2025.10.11.dist-info/RECORD +300 -0
- webscout/Provider/AISEARCH/DeepFind.py +0 -254
- webscout/Provider/OPENAI/Qwen3.py +0 -303
- webscout/Provider/OPENAI/qodo.py +0 -630
- webscout/Provider/OPENAI/xenai.py +0 -514
- webscout/tempid.py +0 -134
- webscout-8.3.7.dist-info/RECORD +0 -301
- {webscout-8.3.7.dist-info → webscout-2025.10.11.dist-info}/WHEEL +0 -0
- {webscout-8.3.7.dist-info → webscout-2025.10.11.dist-info}/entry_points.txt +0 -0
- {webscout-8.3.7.dist-info → webscout-2025.10.11.dist-info}/licenses/LICENSE.md +0 -0
- {webscout-8.3.7.dist-info → webscout-2025.10.11.dist-info}/top_level.txt +0 -0
|
@@ -1,232 +1,232 @@
|
|
|
1
|
-
import re
|
|
2
|
-
import json
|
|
3
|
-
from typing import Dict, Any
|
|
4
|
-
from .https import video_data
|
|
5
|
-
|
|
6
|
-
|
|
7
|
-
class Video:
|
|
8
|
-
|
|
9
|
-
_HEAD = 'https://www.youtube.com/watch?v='
|
|
10
|
-
|
|
11
|
-
def __init__(self, video_id: str):
|
|
12
|
-
"""
|
|
13
|
-
Represents a YouTube video
|
|
14
|
-
|
|
15
|
-
Parameters
|
|
16
|
-
----------
|
|
17
|
-
video_id : str
|
|
18
|
-
The id or url of the video
|
|
19
|
-
"""
|
|
20
|
-
pattern = re.compile(r'.be/(.*?)$|=(.*?)$|^(\w{11})$') # noqa
|
|
21
|
-
match = pattern.search(video_id)
|
|
22
|
-
|
|
23
|
-
if not match:
|
|
24
|
-
raise ValueError('Invalid YouTube video ID or URL')
|
|
25
|
-
|
|
26
|
-
self._matched_id = (
|
|
27
|
-
match.group(1)
|
|
28
|
-
or match.group(2)
|
|
29
|
-
or match.group(3)
|
|
30
|
-
)
|
|
31
|
-
|
|
32
|
-
if self._matched_id:
|
|
33
|
-
self._url = self._HEAD + self._matched_id
|
|
34
|
-
self._video_data = video_data(self._matched_id)
|
|
35
|
-
# Extract basic info for fallback
|
|
36
|
-
title_match = re.search(r'<title>(.*?) - YouTube</title>', self._video_data)
|
|
37
|
-
self.title = title_match.group(1) if title_match else None
|
|
38
|
-
self.id = self._matched_id
|
|
39
|
-
else:
|
|
40
|
-
raise ValueError('Invalid YouTube video ID or URL')
|
|
41
|
-
|
|
42
|
-
def __repr__(self):
|
|
43
|
-
return f'<Video {self._url}>'
|
|
44
|
-
|
|
45
|
-
@property
|
|
46
|
-
def metadata(self) -> Dict[str, Any]:
|
|
47
|
-
"""
|
|
48
|
-
Fetches video metadata in a dict format
|
|
49
|
-
|
|
50
|
-
Returns
|
|
51
|
-
-------
|
|
52
|
-
Dict
|
|
53
|
-
Video metadata in a dict format containing keys: title, id, views, duration, author_id,
|
|
54
|
-
upload_date, url, thumbnails, tags, description, likes, genre, etc.
|
|
55
|
-
"""
|
|
56
|
-
# Multiple patterns to try for video details extraction for robustness
|
|
57
|
-
details_patterns = [
|
|
58
|
-
re.compile(r'videoDetails\":(.*?)\"isLiveContent\":.*?}'),
|
|
59
|
-
re.compile(r'videoDetails\":(.*?),\"playerConfig'),
|
|
60
|
-
re.compile(r'videoDetails\":(.*?),\"playabilityStatus')
|
|
61
|
-
]
|
|
62
|
-
|
|
63
|
-
# Other metadata patterns
|
|
64
|
-
upload_date_pattern = re.compile(r"<meta itemprop=\"uploadDate\" content=\"(.*?)\">")
|
|
65
|
-
genre_pattern = re.compile(r"<meta itemprop=\"genre\" content=\"(.*?)\">")
|
|
66
|
-
like_count_patterns = [
|
|
67
|
-
re.compile(r"iconType\":\"LIKE\"},\"defaultText\":(.*?)}"),
|
|
68
|
-
re.compile(r'\"likeCount\":\"(\d+)\"')
|
|
69
|
-
]
|
|
70
|
-
channel_name_pattern = re.compile(r'"ownerChannelName":"(.*?)"')
|
|
71
|
-
|
|
72
|
-
# Try each pattern for video details
|
|
73
|
-
raw_details_match = None
|
|
74
|
-
for pattern in details_patterns:
|
|
75
|
-
match = pattern.search(self._video_data)
|
|
76
|
-
if match:
|
|
77
|
-
raw_details_match = match
|
|
78
|
-
break
|
|
79
|
-
|
|
80
|
-
if not raw_details_match:
|
|
81
|
-
# Fallback metadata for search results or incomplete video data
|
|
82
|
-
return {
|
|
83
|
-
'title': getattr(self, 'title', None),
|
|
84
|
-
'id': getattr(self, 'id', None),
|
|
85
|
-
'views': getattr(self, 'views', None),
|
|
86
|
-
'streamed': False,
|
|
87
|
-
'duration': None,
|
|
88
|
-
'author_id': None,
|
|
89
|
-
'author_name': None,
|
|
90
|
-
'upload_date': None,
|
|
91
|
-
'url': f"https://www.youtube.com/watch?v={getattr(self, 'id', '')}" if hasattr(self, 'id') else None,
|
|
92
|
-
'thumbnails': None,
|
|
93
|
-
'tags': None,
|
|
94
|
-
'description': None,
|
|
95
|
-
'likes': None,
|
|
96
|
-
'genre': None,
|
|
97
|
-
'is_age_restricted': 'age-restricted' in self._video_data.lower(),
|
|
98
|
-
'is_unlisted': 'unlisted' in self._video_data.lower()
|
|
99
|
-
}
|
|
100
|
-
|
|
101
|
-
raw_details = raw_details_match.group(0)
|
|
102
|
-
|
|
103
|
-
# Extract upload date
|
|
104
|
-
upload_date_match = upload_date_pattern.search(self._video_data)
|
|
105
|
-
upload_date = upload_date_match.group(1) if upload_date_match else None
|
|
106
|
-
|
|
107
|
-
# Extract channel name
|
|
108
|
-
channel_name_match = channel_name_pattern.search(self._video_data)
|
|
109
|
-
channel_name = channel_name_match.group(1) if channel_name_match else None
|
|
110
|
-
|
|
111
|
-
# Parse video details
|
|
112
|
-
try:
|
|
113
|
-
# Clean up the JSON string for parsing
|
|
114
|
-
clean_json = raw_details.replace('videoDetails\":', '')
|
|
115
|
-
# Handle potential JSON parsing issues
|
|
116
|
-
if clean_json.endswith(','):
|
|
117
|
-
clean_json = clean_json[:-1]
|
|
118
|
-
metadata = json.loads(clean_json)
|
|
119
|
-
|
|
120
|
-
data = {
|
|
121
|
-
'title': metadata.get('title'),
|
|
122
|
-
'id': metadata.get('videoId', self._matched_id),
|
|
123
|
-
'views': metadata.get('viewCount'),
|
|
124
|
-
'streamed': metadata.get('isLiveContent', False),
|
|
125
|
-
'duration': metadata.get('lengthSeconds'),
|
|
126
|
-
'author_id': metadata.get('channelId'),
|
|
127
|
-
'author_name': channel_name or metadata.get('author'),
|
|
128
|
-
'upload_date': upload_date,
|
|
129
|
-
'url': f"https://www.youtube.com/watch?v={metadata.get('videoId', self._matched_id)}",
|
|
130
|
-
'thumbnails': metadata.get('thumbnail', {}).get('thumbnails'),
|
|
131
|
-
'tags': metadata.get('keywords'),
|
|
132
|
-
'description': metadata.get('shortDescription'),
|
|
133
|
-
'is_age_restricted': metadata.get('isAgeRestricted', False) or 'age-restricted' in self._video_data.lower(),
|
|
134
|
-
'is_unlisted': 'unlisted' in self._video_data.lower(),
|
|
135
|
-
'is_family_safe': metadata.get('isFamilySafe', True),
|
|
136
|
-
'is_private': metadata.get('isPrivate', False),
|
|
137
|
-
'is_live_content': metadata.get('isLiveContent', False),
|
|
138
|
-
'is_crawlable': metadata.get('isCrawlable', True),
|
|
139
|
-
'allow_ratings': metadata.get('allowRatings', True)
|
|
140
|
-
}
|
|
141
|
-
except (json.JSONDecodeError, KeyError, TypeError) as e:
|
|
142
|
-
# Fallback to basic metadata if JSON parsing fails
|
|
143
|
-
return {
|
|
144
|
-
'title': getattr(self, 'title', None),
|
|
145
|
-
'id': self._matched_id,
|
|
146
|
-
'url': self._url,
|
|
147
|
-
'error': f"Failed to parse video details: {str(e)}"
|
|
148
|
-
}
|
|
149
|
-
|
|
150
|
-
# Try to extract likes count
|
|
151
|
-
likes = None
|
|
152
|
-
for pattern in like_count_patterns:
|
|
153
|
-
try:
|
|
154
|
-
likes_match = pattern.search(self._video_data)
|
|
155
|
-
if likes_match:
|
|
156
|
-
likes_text = likes_match.group(1)
|
|
157
|
-
# Handle different formats of like count
|
|
158
|
-
if '{' in likes_text:
|
|
159
|
-
likes = json.loads(likes_text + '}}}')['accessibility']['accessibilityData']['label'].split(' ')[0].replace(',', '')
|
|
160
|
-
else:
|
|
161
|
-
likes = likes_text
|
|
162
|
-
break
|
|
163
|
-
except (AttributeError, KeyError, json.decoder.JSONDecodeError):
|
|
164
|
-
continue
|
|
165
|
-
|
|
166
|
-
data['likes'] = likes
|
|
167
|
-
|
|
168
|
-
# Try to extract genre
|
|
169
|
-
try:
|
|
170
|
-
genre_match = genre_pattern.search(self._video_data)
|
|
171
|
-
data['genre'] = genre_match.group(1) if genre_match else None
|
|
172
|
-
except AttributeError:
|
|
173
|
-
data['genre'] = None
|
|
174
|
-
|
|
175
|
-
return data
|
|
176
|
-
|
|
177
|
-
|
|
178
|
-
|
|
179
|
-
@property
|
|
180
|
-
def embed_html(self) -> str:
|
|
181
|
-
"""
|
|
182
|
-
Get the embed HTML code for this video
|
|
183
|
-
|
|
184
|
-
Returns:
|
|
185
|
-
HTML iframe code for embedding the video
|
|
186
|
-
"""
|
|
187
|
-
return f'<iframe width="560" height="315" src="https://www.youtube.com/embed/{self._matched_id}" frameborder="0" allow="accelerometer; autoplay; clipboard-write; encrypted-media; gyroscope; picture-in-picture" allowfullscreen></iframe>'
|
|
188
|
-
|
|
189
|
-
@property
|
|
190
|
-
def embed_url(self) -> str:
|
|
191
|
-
"""
|
|
192
|
-
Get the embed URL for this video
|
|
193
|
-
|
|
194
|
-
Returns:
|
|
195
|
-
URL for embedding the video
|
|
196
|
-
"""
|
|
197
|
-
return f'https://www.youtube.com/embed/{self._matched_id}'
|
|
198
|
-
|
|
199
|
-
@property
|
|
200
|
-
def thumbnail_url(self) -> str:
|
|
201
|
-
"""
|
|
202
|
-
Get the thumbnail URL for this video
|
|
203
|
-
|
|
204
|
-
Returns:
|
|
205
|
-
URL of the video thumbnail (high quality)
|
|
206
|
-
"""
|
|
207
|
-
return f'https://i.ytimg.com/vi/{self._matched_id}/hqdefault.jpg'
|
|
208
|
-
|
|
209
|
-
@property
|
|
210
|
-
def thumbnail_urls(self) -> Dict[str, str]:
|
|
211
|
-
"""
|
|
212
|
-
Get all thumbnail URLs for this video in different qualities
|
|
213
|
-
|
|
214
|
-
Returns:
|
|
215
|
-
Dictionary of thumbnail URLs with quality labels
|
|
216
|
-
"""
|
|
217
|
-
return {
|
|
218
|
-
'default': f'https://i.ytimg.com/vi/{self._matched_id}/default.jpg',
|
|
219
|
-
'medium': f'https://i.ytimg.com/vi/{self._matched_id}/mqdefault.jpg',
|
|
220
|
-
'high': f'https://i.ytimg.com/vi/{self._matched_id}/hqdefault.jpg',
|
|
221
|
-
'standard': f'https://i.ytimg.com/vi/{self._matched_id}/sddefault.jpg',
|
|
222
|
-
'maxres': f'https://i.ytimg.com/vi/{self._matched_id}/maxresdefault.jpg'
|
|
223
|
-
}
|
|
224
|
-
|
|
225
|
-
if __name__ == '__main__':
|
|
226
|
-
video = Video('https://www.youtube.com/watch?v=9bZkp7q19f0')
|
|
227
|
-
print(video.metadata)
|
|
228
|
-
|
|
229
|
-
# Example of getting comments
|
|
230
|
-
print("\nFirst 3 comments:")
|
|
231
|
-
for i, comment in enumerate(video.stream_comments(3), 1):
|
|
232
|
-
print(f"{i}. {comment['author']}: {comment['text'][:50]}...")
|
|
1
|
+
import re
|
|
2
|
+
import json
|
|
3
|
+
from typing import Dict, Any
|
|
4
|
+
from .https import video_data
|
|
5
|
+
|
|
6
|
+
|
|
7
|
+
class Video:
|
|
8
|
+
|
|
9
|
+
_HEAD = 'https://www.youtube.com/watch?v='
|
|
10
|
+
|
|
11
|
+
def __init__(self, video_id: str):
|
|
12
|
+
"""
|
|
13
|
+
Represents a YouTube video
|
|
14
|
+
|
|
15
|
+
Parameters
|
|
16
|
+
----------
|
|
17
|
+
video_id : str
|
|
18
|
+
The id or url of the video
|
|
19
|
+
"""
|
|
20
|
+
pattern = re.compile(r'.be/(.*?)$|=(.*?)$|^(\w{11})$') # noqa
|
|
21
|
+
match = pattern.search(video_id)
|
|
22
|
+
|
|
23
|
+
if not match:
|
|
24
|
+
raise ValueError('Invalid YouTube video ID or URL')
|
|
25
|
+
|
|
26
|
+
self._matched_id = (
|
|
27
|
+
match.group(1)
|
|
28
|
+
or match.group(2)
|
|
29
|
+
or match.group(3)
|
|
30
|
+
)
|
|
31
|
+
|
|
32
|
+
if self._matched_id:
|
|
33
|
+
self._url = self._HEAD + self._matched_id
|
|
34
|
+
self._video_data = video_data(self._matched_id)
|
|
35
|
+
# Extract basic info for fallback
|
|
36
|
+
title_match = re.search(r'<title>(.*?) - YouTube</title>', self._video_data)
|
|
37
|
+
self.title = title_match.group(1) if title_match else None
|
|
38
|
+
self.id = self._matched_id
|
|
39
|
+
else:
|
|
40
|
+
raise ValueError('Invalid YouTube video ID or URL')
|
|
41
|
+
|
|
42
|
+
def __repr__(self):
|
|
43
|
+
return f'<Video {self._url}>'
|
|
44
|
+
|
|
45
|
+
@property
|
|
46
|
+
def metadata(self) -> Dict[str, Any]:
|
|
47
|
+
"""
|
|
48
|
+
Fetches video metadata in a dict format
|
|
49
|
+
|
|
50
|
+
Returns
|
|
51
|
+
-------
|
|
52
|
+
Dict
|
|
53
|
+
Video metadata in a dict format containing keys: title, id, views, duration, author_id,
|
|
54
|
+
upload_date, url, thumbnails, tags, description, likes, genre, etc.
|
|
55
|
+
"""
|
|
56
|
+
# Multiple patterns to try for video details extraction for robustness
|
|
57
|
+
details_patterns = [
|
|
58
|
+
re.compile(r'videoDetails\":(.*?)\"isLiveContent\":.*?}'),
|
|
59
|
+
re.compile(r'videoDetails\":(.*?),\"playerConfig'),
|
|
60
|
+
re.compile(r'videoDetails\":(.*?),\"playabilityStatus')
|
|
61
|
+
]
|
|
62
|
+
|
|
63
|
+
# Other metadata patterns
|
|
64
|
+
upload_date_pattern = re.compile(r"<meta itemprop=\"uploadDate\" content=\"(.*?)\">")
|
|
65
|
+
genre_pattern = re.compile(r"<meta itemprop=\"genre\" content=\"(.*?)\">")
|
|
66
|
+
like_count_patterns = [
|
|
67
|
+
re.compile(r"iconType\":\"LIKE\"},\"defaultText\":(.*?)}"),
|
|
68
|
+
re.compile(r'\"likeCount\":\"(\d+)\"')
|
|
69
|
+
]
|
|
70
|
+
channel_name_pattern = re.compile(r'"ownerChannelName":"(.*?)"')
|
|
71
|
+
|
|
72
|
+
# Try each pattern for video details
|
|
73
|
+
raw_details_match = None
|
|
74
|
+
for pattern in details_patterns:
|
|
75
|
+
match = pattern.search(self._video_data)
|
|
76
|
+
if match:
|
|
77
|
+
raw_details_match = match
|
|
78
|
+
break
|
|
79
|
+
|
|
80
|
+
if not raw_details_match:
|
|
81
|
+
# Fallback metadata for search results or incomplete video data
|
|
82
|
+
return {
|
|
83
|
+
'title': getattr(self, 'title', None),
|
|
84
|
+
'id': getattr(self, 'id', None),
|
|
85
|
+
'views': getattr(self, 'views', None),
|
|
86
|
+
'streamed': False,
|
|
87
|
+
'duration': None,
|
|
88
|
+
'author_id': None,
|
|
89
|
+
'author_name': None,
|
|
90
|
+
'upload_date': None,
|
|
91
|
+
'url': f"https://www.youtube.com/watch?v={getattr(self, 'id', '')}" if hasattr(self, 'id') else None,
|
|
92
|
+
'thumbnails': None,
|
|
93
|
+
'tags': None,
|
|
94
|
+
'description': None,
|
|
95
|
+
'likes': None,
|
|
96
|
+
'genre': None,
|
|
97
|
+
'is_age_restricted': 'age-restricted' in self._video_data.lower(),
|
|
98
|
+
'is_unlisted': 'unlisted' in self._video_data.lower()
|
|
99
|
+
}
|
|
100
|
+
|
|
101
|
+
raw_details = raw_details_match.group(0)
|
|
102
|
+
|
|
103
|
+
# Extract upload date
|
|
104
|
+
upload_date_match = upload_date_pattern.search(self._video_data)
|
|
105
|
+
upload_date = upload_date_match.group(1) if upload_date_match else None
|
|
106
|
+
|
|
107
|
+
# Extract channel name
|
|
108
|
+
channel_name_match = channel_name_pattern.search(self._video_data)
|
|
109
|
+
channel_name = channel_name_match.group(1) if channel_name_match else None
|
|
110
|
+
|
|
111
|
+
# Parse video details
|
|
112
|
+
try:
|
|
113
|
+
# Clean up the JSON string for parsing
|
|
114
|
+
clean_json = raw_details.replace('videoDetails\":', '')
|
|
115
|
+
# Handle potential JSON parsing issues
|
|
116
|
+
if clean_json.endswith(','):
|
|
117
|
+
clean_json = clean_json[:-1]
|
|
118
|
+
metadata = json.loads(clean_json)
|
|
119
|
+
|
|
120
|
+
data = {
|
|
121
|
+
'title': metadata.get('title'),
|
|
122
|
+
'id': metadata.get('videoId', self._matched_id),
|
|
123
|
+
'views': metadata.get('viewCount'),
|
|
124
|
+
'streamed': metadata.get('isLiveContent', False),
|
|
125
|
+
'duration': metadata.get('lengthSeconds'),
|
|
126
|
+
'author_id': metadata.get('channelId'),
|
|
127
|
+
'author_name': channel_name or metadata.get('author'),
|
|
128
|
+
'upload_date': upload_date,
|
|
129
|
+
'url': f"https://www.youtube.com/watch?v={metadata.get('videoId', self._matched_id)}",
|
|
130
|
+
'thumbnails': metadata.get('thumbnail', {}).get('thumbnails'),
|
|
131
|
+
'tags': metadata.get('keywords'),
|
|
132
|
+
'description': metadata.get('shortDescription'),
|
|
133
|
+
'is_age_restricted': metadata.get('isAgeRestricted', False) or 'age-restricted' in self._video_data.lower(),
|
|
134
|
+
'is_unlisted': 'unlisted' in self._video_data.lower(),
|
|
135
|
+
'is_family_safe': metadata.get('isFamilySafe', True),
|
|
136
|
+
'is_private': metadata.get('isPrivate', False),
|
|
137
|
+
'is_live_content': metadata.get('isLiveContent', False),
|
|
138
|
+
'is_crawlable': metadata.get('isCrawlable', True),
|
|
139
|
+
'allow_ratings': metadata.get('allowRatings', True)
|
|
140
|
+
}
|
|
141
|
+
except (json.JSONDecodeError, KeyError, TypeError) as e:
|
|
142
|
+
# Fallback to basic metadata if JSON parsing fails
|
|
143
|
+
return {
|
|
144
|
+
'title': getattr(self, 'title', None),
|
|
145
|
+
'id': self._matched_id,
|
|
146
|
+
'url': self._url,
|
|
147
|
+
'error': f"Failed to parse video details: {str(e)}"
|
|
148
|
+
}
|
|
149
|
+
|
|
150
|
+
# Try to extract likes count
|
|
151
|
+
likes = None
|
|
152
|
+
for pattern in like_count_patterns:
|
|
153
|
+
try:
|
|
154
|
+
likes_match = pattern.search(self._video_data)
|
|
155
|
+
if likes_match:
|
|
156
|
+
likes_text = likes_match.group(1)
|
|
157
|
+
# Handle different formats of like count
|
|
158
|
+
if '{' in likes_text:
|
|
159
|
+
likes = json.loads(likes_text + '}}}')['accessibility']['accessibilityData']['label'].split(' ')[0].replace(',', '')
|
|
160
|
+
else:
|
|
161
|
+
likes = likes_text
|
|
162
|
+
break
|
|
163
|
+
except (AttributeError, KeyError, json.decoder.JSONDecodeError):
|
|
164
|
+
continue
|
|
165
|
+
|
|
166
|
+
data['likes'] = likes
|
|
167
|
+
|
|
168
|
+
# Try to extract genre
|
|
169
|
+
try:
|
|
170
|
+
genre_match = genre_pattern.search(self._video_data)
|
|
171
|
+
data['genre'] = genre_match.group(1) if genre_match else None
|
|
172
|
+
except AttributeError:
|
|
173
|
+
data['genre'] = None
|
|
174
|
+
|
|
175
|
+
return data
|
|
176
|
+
|
|
177
|
+
|
|
178
|
+
|
|
179
|
+
@property
|
|
180
|
+
def embed_html(self) -> str:
|
|
181
|
+
"""
|
|
182
|
+
Get the embed HTML code for this video
|
|
183
|
+
|
|
184
|
+
Returns:
|
|
185
|
+
HTML iframe code for embedding the video
|
|
186
|
+
"""
|
|
187
|
+
return f'<iframe width="560" height="315" src="https://www.youtube.com/embed/{self._matched_id}" frameborder="0" allow="accelerometer; autoplay; clipboard-write; encrypted-media; gyroscope; picture-in-picture" allowfullscreen></iframe>'
|
|
188
|
+
|
|
189
|
+
@property
|
|
190
|
+
def embed_url(self) -> str:
|
|
191
|
+
"""
|
|
192
|
+
Get the embed URL for this video
|
|
193
|
+
|
|
194
|
+
Returns:
|
|
195
|
+
URL for embedding the video
|
|
196
|
+
"""
|
|
197
|
+
return f'https://www.youtube.com/embed/{self._matched_id}'
|
|
198
|
+
|
|
199
|
+
@property
|
|
200
|
+
def thumbnail_url(self) -> str:
|
|
201
|
+
"""
|
|
202
|
+
Get the thumbnail URL for this video
|
|
203
|
+
|
|
204
|
+
Returns:
|
|
205
|
+
URL of the video thumbnail (high quality)
|
|
206
|
+
"""
|
|
207
|
+
return f'https://i.ytimg.com/vi/{self._matched_id}/hqdefault.jpg'
|
|
208
|
+
|
|
209
|
+
@property
|
|
210
|
+
def thumbnail_urls(self) -> Dict[str, str]:
|
|
211
|
+
"""
|
|
212
|
+
Get all thumbnail URLs for this video in different qualities
|
|
213
|
+
|
|
214
|
+
Returns:
|
|
215
|
+
Dictionary of thumbnail URLs with quality labels
|
|
216
|
+
"""
|
|
217
|
+
return {
|
|
218
|
+
'default': f'https://i.ytimg.com/vi/{self._matched_id}/default.jpg',
|
|
219
|
+
'medium': f'https://i.ytimg.com/vi/{self._matched_id}/mqdefault.jpg',
|
|
220
|
+
'high': f'https://i.ytimg.com/vi/{self._matched_id}/hqdefault.jpg',
|
|
221
|
+
'standard': f'https://i.ytimg.com/vi/{self._matched_id}/sddefault.jpg',
|
|
222
|
+
'maxres': f'https://i.ytimg.com/vi/{self._matched_id}/maxresdefault.jpg'
|
|
223
|
+
}
|
|
224
|
+
|
|
225
|
+
if __name__ == '__main__':
|
|
226
|
+
video = Video('https://www.youtube.com/watch?v=9bZkp7q19f0')
|
|
227
|
+
print(video.metadata)
|
|
228
|
+
|
|
229
|
+
# Example of getting comments
|
|
230
|
+
print("\nFirst 3 comments:")
|
|
231
|
+
for i, comment in enumerate(video.stream_comments(3), 1):
|
|
232
|
+
print(f"{i}. {comment['author']}: {comment['text'][:50]}...")
|
|
@@ -1,9 +1,9 @@
|
|
|
1
|
-
"""
|
|
2
|
-
AutoCoder Module - Part of Webscout
|
|
3
|
-
Provides automated code generation and manipulation capabilities.
|
|
4
|
-
"""
|
|
5
|
-
|
|
6
|
-
from .autocoder import *
|
|
7
|
-
from .autocoder_utiles import *
|
|
8
|
-
|
|
9
|
-
# __all__ = [] # Add your public module names here
|
|
1
|
+
"""
|
|
2
|
+
AutoCoder Module - Part of Webscout
|
|
3
|
+
Provides automated code generation and manipulation capabilities.
|
|
4
|
+
"""
|
|
5
|
+
|
|
6
|
+
from .autocoder import *
|
|
7
|
+
from .autocoder_utiles import *
|
|
8
|
+
|
|
9
|
+
# __all__ = [] # Add your public module names here
|