webscout 6.4__py3-none-any.whl → 6.6__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of webscout might be problematic. Click here for more details.

Files changed (116)
  1. webscout/AIutel.py +7 -54
  2. webscout/DWEBS.py +48 -26
  3. webscout/{YTdownloader.py → Extra/YTToolkit/YTdownloader.py} +990 -1103
  4. webscout/Extra/YTToolkit/__init__.py +3 -0
  5. webscout/{transcriber.py → Extra/YTToolkit/transcriber.py} +1 -1
  6. webscout/Extra/YTToolkit/ytapi/__init__.py +6 -0
  7. webscout/Extra/YTToolkit/ytapi/channel.py +307 -0
  8. webscout/Extra/YTToolkit/ytapi/errors.py +13 -0
  9. webscout/Extra/YTToolkit/ytapi/extras.py +45 -0
  10. webscout/Extra/YTToolkit/ytapi/https.py +88 -0
  11. webscout/Extra/YTToolkit/ytapi/patterns.py +61 -0
  12. webscout/Extra/YTToolkit/ytapi/playlist.py +59 -0
  13. webscout/Extra/YTToolkit/ytapi/pool.py +8 -0
  14. webscout/Extra/YTToolkit/ytapi/query.py +37 -0
  15. webscout/Extra/YTToolkit/ytapi/stream.py +60 -0
  16. webscout/Extra/YTToolkit/ytapi/utils.py +62 -0
  17. webscout/Extra/YTToolkit/ytapi/video.py +102 -0
  18. webscout/Extra/__init__.py +2 -1
  19. webscout/Extra/autocoder/autocoder_utiles.py +119 -101
  20. webscout/Extra/autocoder/rawdog.py +679 -680
  21. webscout/Extra/gguf.py +441 -441
  22. webscout/Extra/markdownlite/__init__.py +862 -0
  23. webscout/Extra/weather_ascii.py +2 -2
  24. webscout/Provider/AISEARCH/__init__.py +2 -0
  25. webscout/Provider/AISEARCH/ooai.py +155 -0
  26. webscout/Provider/Amigo.py +70 -85
  27. webscout/Provider/{prefind.py → Jadve.py} +72 -70
  28. webscout/Provider/Netwrck.py +235 -0
  29. webscout/Provider/Openai.py +4 -3
  30. webscout/Provider/PI.py +292 -221
  31. webscout/Provider/PizzaGPT.py +3 -3
  32. webscout/Provider/Reka.py +0 -1
  33. webscout/Provider/TTS/__init__.py +5 -1
  34. webscout/Provider/TTS/deepgram.py +183 -0
  35. webscout/Provider/TTS/elevenlabs.py +137 -0
  36. webscout/Provider/TTS/gesserit.py +151 -0
  37. webscout/Provider/TTS/murfai.py +139 -0
  38. webscout/Provider/TTS/parler.py +134 -107
  39. webscout/Provider/TTS/streamElements.py +360 -275
  40. webscout/Provider/TTS/utils.py +280 -0
  41. webscout/Provider/TTS/voicepod.py +116 -116
  42. webscout/Provider/TeachAnything.py +15 -2
  43. webscout/Provider/Youchat.py +42 -8
  44. webscout/Provider/__init__.py +8 -21
  45. webscout/Provider/meta.py +794 -779
  46. webscout/Provider/multichat.py +230 -0
  47. webscout/Provider/promptrefine.py +2 -2
  48. webscout/Provider/talkai.py +10 -13
  49. webscout/Provider/turboseek.py +5 -4
  50. webscout/Provider/tutorai.py +8 -112
  51. webscout/Provider/typegpt.py +5 -7
  52. webscout/Provider/x0gpt.py +81 -9
  53. webscout/Provider/yep.py +123 -361
  54. webscout/__init__.py +33 -28
  55. webscout/conversation.py +24 -9
  56. webscout/exceptions.py +188 -20
  57. webscout/litprinter/__init__.py +719 -831
  58. webscout/litprinter/colors.py +54 -0
  59. webscout/optimizers.py +420 -270
  60. webscout/prompt_manager.py +279 -279
  61. webscout/scout/__init__.py +8 -0
  62. webscout/scout/core/__init__.py +7 -0
  63. webscout/scout/core/crawler.py +140 -0
  64. webscout/scout/core/scout.py +571 -0
  65. webscout/scout/core/search_result.py +96 -0
  66. webscout/scout/core/text_analyzer.py +63 -0
  67. webscout/scout/core/text_utils.py +277 -0
  68. webscout/scout/core/web_analyzer.py +52 -0
  69. webscout/scout/core.py +884 -0
  70. webscout/scout/element.py +460 -0
  71. webscout/scout/parsers/__init__.py +69 -0
  72. webscout/scout/parsers/html5lib_parser.py +172 -0
  73. webscout/scout/parsers/html_parser.py +236 -0
  74. webscout/scout/parsers/lxml_parser.py +178 -0
  75. webscout/scout/utils.py +38 -0
  76. webscout/update_checker.py +184 -125
  77. webscout/version.py +1 -1
  78. webscout/zeroart/__init__.py +55 -0
  79. webscout/zeroart/base.py +60 -0
  80. webscout/zeroart/effects.py +99 -0
  81. webscout/zeroart/fonts.py +816 -0
  82. webscout/zerodir/__init__.py +225 -0
  83. {webscout-6.4.dist-info → webscout-6.6.dist-info}/METADATA +18 -231
  84. webscout-6.6.dist-info/RECORD +197 -0
  85. webscout-6.6.dist-info/top_level.txt +2 -0
  86. webstoken/__init__.py +30 -0
  87. webstoken/classifier.py +189 -0
  88. webstoken/keywords.py +216 -0
  89. webstoken/language.py +128 -0
  90. webstoken/ner.py +164 -0
  91. webstoken/normalizer.py +35 -0
  92. webstoken/processor.py +77 -0
  93. webstoken/sentiment.py +206 -0
  94. webstoken/stemmer.py +73 -0
  95. webstoken/t.py +75 -0
  96. webstoken/tagger.py +60 -0
  97. webstoken/tokenizer.py +158 -0
  98. webscout/Agents/Onlinesearcher.py +0 -182
  99. webscout/Agents/__init__.py +0 -2
  100. webscout/Agents/functioncall.py +0 -248
  101. webscout/Bing_search.py +0 -251
  102. webscout/Provider/Perplexity.py +0 -599
  103. webscout/Provider/RoboCoders.py +0 -206
  104. webscout/Provider/genspark.py +0 -225
  105. webscout/Provider/perplexitylabs.py +0 -265
  106. webscout/Provider/twitterclone.py +0 -251
  107. webscout/Provider/upstage.py +0 -230
  108. webscout/gpt4free.py +0 -666
  109. webscout/requestsHTMLfix.py +0 -775
  110. webscout/webai.py +0 -2590
  111. webscout-6.4.dist-info/RECORD +0 -154
  112. webscout-6.4.dist-info/top_level.txt +0 -1
  113. webscout/Provider/{felo_search.py → AISEARCH/felo_search.py} +0 -0
  114. {webscout-6.4.dist-info → webscout-6.6.dist-info}/LICENSE.md +0 -0
  115. {webscout-6.4.dist-info → webscout-6.6.dist-info}/WHEEL +0 -0
  116. {webscout-6.4.dist-info → webscout-6.6.dist-info}/entry_points.txt +0 -0
webscout/Provider/meta.py CHANGED
@@ -1,779 +1,794 @@
1
- import json
2
- import logging
3
- import time
4
- import urllib
5
- import uuid
6
- from typing import Dict, Generator, Iterator, List, Union
7
-
8
- import random
9
-
10
-
11
- from webscout.requestsHTMLfix import HTMLSession
12
- import requests
13
- from bs4 import BeautifulSoup
14
-
15
- import requests
16
-
17
-
18
- from webscout.AIutel import Optimizers
19
- from webscout.AIutel import Conversation
20
- from webscout.AIutel import AwesomePrompts, sanitize_stream
21
- from webscout.AIbase import Provider
22
- from webscout import exceptions
23
-
24
- MAX_RETRIES = 3
25
-
26
- def generate_offline_threading_id() -> str:
27
- """
28
- Generates an offline threading ID.
29
-
30
- Returns:
31
- str: The generated offline threading ID.
32
- """
33
- # Maximum value for a 64-bit integer in Python
34
- max_int = (1 << 64) - 1
35
- mask22_bits = (1 << 22) - 1
36
-
37
- # Function to get the current timestamp in milliseconds
38
- def get_current_timestamp():
39
- return int(time.time() * 1000)
40
-
41
- # Function to generate a random 64-bit integer
42
- def get_random_64bit_int():
43
- return random.getrandbits(64)
44
-
45
- # Combine timestamp and random value
46
- def combine_and_mask(timestamp, random_value):
47
- shifted_timestamp = timestamp << 22
48
- masked_random = random_value & mask22_bits
49
- return (shifted_timestamp | masked_random) & max_int
50
-
51
- timestamp = get_current_timestamp()
52
- random_value = get_random_64bit_int()
53
- threading_id = combine_and_mask(timestamp, random_value)
54
-
55
- return str(threading_id)
56
-
57
-
58
- def extract_value(text: str, start_str: str, end_str: str) -> str:
59
- """
60
- Helper function to extract a specific value from the given text using a key.
61
-
62
- Args:
63
- text (str): The text from which to extract the value.
64
- start_str (str): The starting key.
65
- end_str (str): The ending key.
66
-
67
- Returns:
68
- str: The extracted value.
69
- """
70
- start = text.find(start_str) + len(start_str)
71
- end = text.find(end_str, start)
72
- return text[start:end]
73
-
74
-
75
- def format_response(response: dict) -> str:
76
- """
77
- Formats the response from Meta AI to remove unnecessary characters.
78
-
79
- Args:
80
- response (dict): The dictionnary containing the response to format.
81
-
82
- Returns:
83
- str: The formatted response.
84
- """
85
- text = ""
86
- for content in (
87
- response.get("data", {})
88
- .get("node", {})
89
- .get("bot_response_message", {})
90
- .get("composed_text", {})
91
- .get("content", [])
92
- ):
93
- text += content["text"] + "\n"
94
- return text
95
-
96
-
97
- # Function to perform the login
98
- def get_fb_session(email, password, proxies=None):
99
- login_url = "https://mbasic.facebook.com/login/"
100
- headers = {
101
- "authority": "mbasic.facebook.com",
102
- "accept": "text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.7",
103
- "accept-language": "en-US,en;q=0.9",
104
- "sec-ch-ua": '"Chromium";v="122", "Not(A:Brand";v="24", "Google Chrome";v="122"',
105
- "sec-ch-ua-mobile": "?0",
106
- "sec-ch-ua-platform": '"macOS"',
107
- "sec-fetch-dest": "document",
108
- "sec-fetch-mode": "navigate",
109
- "sec-fetch-site": "none",
110
- "sec-fetch-user": "?1",
111
- "upgrade-insecure-requests": "1",
112
- "user-agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/122.0.0.0 Safari/537.36",
113
- }
114
- # Send the GET request
115
- response = requests.get(login_url, headers=headers, proxies=proxies)
116
- soup = BeautifulSoup(response.text, "html.parser")
117
-
118
- # Parse necessary parameters from the login form
119
- lsd = soup.find("input", {"name": "lsd"})["value"]
120
- jazoest = soup.find("input", {"name": "jazoest"})["value"]
121
- li = soup.find("input", {"name": "li"})["value"]
122
- m_ts = soup.find("input", {"name": "m_ts"})["value"]
123
-
124
- # Define the URL and body for the POST request to submit the login form
125
- post_url = "https://mbasic.facebook.com/login/device-based/regular/login/?refsrc=deprecated&lwv=100"
126
- data = {
127
- "lsd": lsd,
128
- "jazoest": jazoest,
129
- "m_ts": m_ts,
130
- "li": li,
131
- "try_number": "0",
132
- "unrecognized_tries": "0",
133
- "email": email,
134
- "pass": password,
135
- "login": "Log In",
136
- "bi_xrwh": "0",
137
- }
138
-
139
- headers = {
140
- "authority": "mbasic.facebook.com",
141
- "accept": "text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.7",
142
- "accept-language": "en-US,en;q=0.9",
143
- "cache-control": "no-cache",
144
- "content-type": "application/x-www-form-urlencoded",
145
- "cookie": f"datr={response.cookies.get('datr')}; sb={response.cookies.get('sb')}; ps_n=1; ps_l=1",
146
- "dpr": "2",
147
- "origin": "https://mbasic.facebook.com",
148
- "pragma": "no-cache",
149
- "referer": "https://mbasic.facebook.com/login/",
150
- "sec-fetch-site": "same-origin",
151
- "sec-fetch-user": "?1",
152
- "upgrade-insecure-requests": "1",
153
- "user-agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/122.0.0.0 Safari/537.36",
154
- "viewport-width": "1728",
155
- }
156
-
157
- # Send the POST request
158
- session = requests.session()
159
- session.proxies = proxies
160
-
161
- result = session.post(post_url, headers=headers, data=data)
162
- if "sb" not in session.cookies:
163
- raise exceptions.FacebookInvalidCredentialsException(
164
- "Was not able to login to Facebook. Please check your credentials. "
165
- "You may also have been rate limited. Try to connect to Facebook manually."
166
- )
167
-
168
- cookies = {
169
- **result.cookies.get_dict(),
170
- "sb": session.cookies["sb"],
171
- "xs": session.cookies["xs"],
172
- "fr": session.cookies["fr"],
173
- "c_user": session.cookies["c_user"],
174
- }
175
-
176
- response_login = {
177
- "cookies": cookies,
178
- "headers": result.headers,
179
- "response": response.text,
180
- }
181
- meta_ai_cookies = get_cookies()
182
-
183
- url = "https://www.meta.ai/state/"
184
-
185
- payload = f'__a=1&lsd={meta_ai_cookies["lsd"]}'
186
- headers = {
187
- "authority": "www.meta.ai",
188
- "accept": "*/*",
189
- "accept-language": "en-US,en;q=0.9",
190
- "cache-control": "no-cache",
191
- "content-type": "application/x-www-form-urlencoded",
192
- "cookie": f'ps_n=1; ps_l=1; dpr=2; _js_datr={meta_ai_cookies["_js_datr"]}; abra_csrf={meta_ai_cookies["abra_csrf"]}; datr={meta_ai_cookies["datr"]};; ps_l=1; ps_n=1',
193
- "origin": "https://www.meta.ai",
194
- "pragma": "no-cache",
195
- "referer": "https://www.meta.ai/",
196
- "sec-fetch-mode": "cors",
197
- "sec-fetch-site": "same-origin",
198
- "user-agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/122.0.0.0 Safari/537.36",
199
- }
200
-
201
- response = requests.request("POST", url, headers=headers, data=payload, proxies=proxies)
202
-
203
- state = extract_value(response.text, start_str='"state":"', end_str='"')
204
-
205
- url = f"https://www.facebook.com/oidc/?app_id=1358015658191005&scope=openid%20linking&response_type=code&redirect_uri=https%3A%2F%2Fwww.meta.ai%2Fauth%2F&no_universal_links=1&deoia=1&state={state}"
206
- payload = {}
207
- headers = {
208
- "authority": "www.facebook.com",
209
- "accept": "text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.7",
210
- "accept-language": "en-US,en;q=0.9",
211
- "cache-control": "no-cache",
212
- "cookie": f"datr={response_login['cookies']['datr']}; sb={response_login['cookies']['sb']}; c_user={response_login['cookies']['c_user']}; xs={response_login['cookies']['xs']}; fr={response_login['cookies']['fr']}; m_page_voice={response_login['cookies']['m_page_voice']}; abra_csrf={meta_ai_cookies['abra_csrf']};",
213
- "sec-fetch-dest": "document",
214
- "sec-fetch-mode": "navigate",
215
- "sec-fetch-site": "cross-site",
216
- "sec-fetch-user": "?1",
217
- "upgrade-insecure-requests": "1",
218
- "user-agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/122.0.0.0 Safari/537.36",
219
- }
220
- session = requests.session()
221
- session.proxies = proxies
222
- response = session.get(url, headers=headers, data=payload, allow_redirects=False)
223
-
224
- next_url = response.headers["Location"]
225
-
226
- url = next_url
227
-
228
- payload = {}
229
- headers = {
230
- "User-Agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10.15; rv:125.0) Gecko/20100101 Firefox/125.0",
231
- "Accept": "text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,*/*;q=0.8",
232
- "Accept-Language": "en-US,en;q=0.5",
233
- "Accept-Encoding": "gzip, deflate, br",
234
- "Referer": "https://www.meta.ai/",
235
- "Connection": "keep-alive",
236
- "Cookie": f'dpr=2; abra_csrf={meta_ai_cookies["abra_csrf"]}; datr={meta_ai_cookies["_js_datr"]}',
237
- "Upgrade-Insecure-Requests": "1",
238
- "Sec-Fetch-Dest": "document",
239
- "Sec-Fetch-Mode": "navigate",
240
- "Sec-Fetch-Site": "cross-site",
241
- "Sec-Fetch-User": "?1",
242
- "TE": "trailers",
243
- }
244
- session.get(url, headers=headers, data=payload)
245
- cookies = session.cookies.get_dict()
246
- if "abra_sess" not in cookies:
247
- raise exceptions.FacebookInvalidCredentialsException(
248
- "Was not able to login to Facebook. Please check your credentials. "
249
- "You may also have been rate limited. Try to connect to Facebook manually."
250
- )
251
- logging.info("Successfully logged in to Facebook.")
252
- return cookies
253
-
254
-
255
- def get_cookies() -> dict:
256
- """
257
- Extracts necessary cookies from the Meta AI main page.
258
-
259
- Returns:
260
- dict: A dictionary containing essential cookies.
261
- """
262
- session = HTMLSession()
263
- response = session.get("https://www.meta.ai/")
264
- return {
265
- "_js_datr": extract_value(
266
- response.text, start_str='_js_datr":{"value":"', end_str='",'
267
- ),
268
- "abra_csrf": extract_value(
269
- response.text, start_str='abra_csrf":{"value":"', end_str='",'
270
- ),
271
- "datr": extract_value(
272
- response.text, start_str='datr":{"value":"', end_str='",'
273
- ),
274
- "lsd": extract_value(
275
- response.text, start_str='"LSD",[],{"token":"', end_str='"}'
276
- ),
277
- }
278
- class Meta(Provider):
279
- """
280
- A class to interact with the Meta AI API to obtain and use access tokens for sending
281
- and receiving messages from the Meta AI Chat API.
282
- """
283
-
284
- def __init__(
285
- self,
286
- fb_email: str = None,
287
- fb_password: str = None,
288
- proxy: dict = None,
289
- is_conversation: bool = True,
290
- max_tokens: int = 600,
291
- timeout: int = 30,
292
- intro: str = None,
293
- filepath: str = None,
294
- update_file: bool = True,
295
- proxies: dict = {},
296
- history_offset: int = 10250,
297
- act: str = None,
298
- ):
299
- """
300
- Initializes the Meta AI API with given parameters.
301
-
302
- Args:
303
- fb_email (str, optional): Your Facebook email address. Defaults to None.
304
- fb_password (str, optional): Your Facebook password. Defaults to None.
305
- proxy (dict, optional): Proxy settings for requests. Defaults to None.
306
- is_conversation (bool, optional): Flag for chatting conversationally. Defaults to True.
307
- max_tokens (int, optional): Maximum number of tokens to be generated upon completion. Defaults to 600.
308
- timeout (int, optional): Http request timeout. Defaults to 30.
309
- intro (str, optional): Conversation introductory prompt. Defaults to None.
310
- filepath (str, optional): Path to file containing conversation history. Defaults to None.
311
- update_file (bool, optional): Add new prompts and responses to the file. Defaults to True.
312
- proxies (dict, optional): Http request proxies. Defaults to {}.
313
- history_offset (int, optional): Limit conversation history to this number of last texts. Defaults to 10250.
314
- act (str|int, optional): Awesome prompt key or index. (Used as intro). Defaults to None.
315
- """
316
- self.session = requests.Session()
317
- self.session.headers.update(
318
- {
319
- "user-agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 "
320
- "(KHTML, like Gecko) Chrome/122.0.0.0 Safari/537.36",
321
- }
322
- )
323
- self.access_token = None
324
- self.fb_email = fb_email
325
- self.fb_password = fb_password
326
- self.proxy = proxy
327
- if self.proxy and not self.check_proxy():
328
- raise ConnectionError(
329
- "Unable to connect to proxy. Please check your proxy settings."
330
- )
331
- self.is_conversation = is_conversation
332
- self.max_tokens_to_sample = max_tokens
333
- self.timeout = timeout
334
- self.last_response = {}
335
- self.is_authed = fb_password is not None and fb_email is not None
336
- self.cookies = self.get_cookies()
337
- self.external_conversation_id = None
338
- self.offline_threading_id = None
339
-
340
- self.__available_optimizers = (
341
- method
342
- for method in dir(Optimizers)
343
- if callable(getattr(Optimizers, method)) and not method.startswith("__")
344
- )
345
- Conversation.intro = (
346
- AwesomePrompts().get_act(
347
- act, raise_not_found=True, default=None, case_insensitive=True
348
- )
349
- if act
350
- else intro or Conversation.intro
351
- )
352
- self.conversation = Conversation(
353
- is_conversation, self.max_tokens_to_sample, filepath, update_file
354
- )
355
- self.conversation.history_offset = history_offset
356
- self.session.proxies = proxies
357
-
358
- def check_proxy(self, test_url: str = "https://api.ipify.org/?format=json") -> bool:
359
- """
360
- Checks the proxy connection by making a request to a test URL.
361
-
362
- Args:
363
- test_url (str): A test site from which we check that the proxy is installed correctly.
364
-
365
- Returns:
366
- bool: True if the proxy is working, False otherwise.
367
- """
368
- try:
369
- response = self.session.get(test_url, proxies=self.proxy, timeout=10)
370
- if response.status_code == 200:
371
- self.session.proxies = self.proxy
372
- return True
373
- return False
374
- except requests.RequestException:
375
- return False
376
-
377
- def get_access_token(self) -> str:
378
- """
379
- Retrieves an access token using Meta's authentication API.
380
-
381
- Returns:
382
- str: A valid access token.
383
- """
384
-
385
- if self.access_token:
386
- return self.access_token
387
-
388
- url = "https://www.meta.ai/api/graphql/"
389
- payload = {
390
- "lsd": self.cookies["lsd"],
391
- "fb_api_caller_class": "RelayModern",
392
- "fb_api_req_friendly_name": "useAbraAcceptTOSForTempUserMutation",
393
- "variables": {
394
- "dob": "1999-01-01",
395
- "icebreaker_type": "TEXT",
396
- "__relay_internal__pv__WebPixelRatiorelayprovider": 1,
397
- },
398
- "doc_id": "7604648749596940",
399
- }
400
- payload = urllib.parse.urlencode(payload) # noqa
401
- headers = {
402
- "content-type": "application/x-www-form-urlencoded",
403
- "cookie": f'_js_datr={self.cookies["_js_datr"]}; '
404
- f'abra_csrf={self.cookies["abra_csrf"]}; datr={self.cookies["datr"]};',
405
- "sec-fetch-site": "same-origin",
406
- "x-fb-friendly-name": "useAbraAcceptTOSForTempUserMutation",
407
- }
408
-
409
- response = self.session.post(url, headers=headers, data=payload)
410
-
411
- try:
412
- auth_json = response.json()
413
- except json.JSONDecodeError:
414
- raise exceptions.FacebookRegionBlocked(
415
- "Unable to receive a valid response from Meta AI. This is likely due to your region being blocked. "
416
- "Try manually accessing https://www.meta.ai/ to confirm."
417
- )
418
-
419
- access_token = auth_json["data"]["xab_abra_accept_terms_of_service"][
420
- "new_temp_user_auth"
421
- ]["access_token"]
422
-
423
- # Need to sleep for a bit, for some reason the API doesn't like it when we send request too quickly
424
- # (maybe Meta needs to register Cookies on their side?)
425
- time.sleep(1)
426
-
427
- return access_token
428
-
429
- def ask(
430
- self,
431
- prompt: str,
432
- stream: bool = False,
433
- raw: bool = False,
434
- optimizer: str = None,
435
- conversationally: bool = False,
436
- ) -> Union[Dict, Generator[Dict, None, None]]:
437
- """
438
- Sends a message to the Meta AI and returns the response.
439
-
440
- Args:
441
- prompt (str): The prompt to send.
442
- stream (bool): Whether to stream the response or not. Defaults to False.
443
- raw (bool, optional): Stream back raw response as received. Defaults to False.
444
- optimizer (str, optional): Prompt optimizer name - `[code, shell_command]`. Defaults to None.
445
- conversationally (bool, optional): Chat conversationally when using optimizer. Defaults to False.
446
- Returns:
447
- Union[Dict, Generator[Dict, None, None]]: A dictionary containing the response message and sources, or a generator yielding such dictionaries.
448
- """
449
- conversation_prompt = self.conversation.gen_complete_prompt(prompt)
450
- if optimizer:
451
- if optimizer in self.__available_optimizers:
452
- conversation_prompt = getattr(Optimizers, optimizer)(
453
- conversation_prompt if conversationally else prompt
454
- )
455
- else:
456
- raise Exception(
457
- f"Optimizer is not one of {self.__available_optimizers}"
458
- )
459
-
460
- if not self.is_authed:
461
- self.access_token = self.get_access_token()
462
- auth_payload = {"access_token": self.access_token}
463
- url = "https://graph.meta.ai/graphql?locale=user"
464
-
465
- else:
466
- auth_payload = {"fb_dtsg": self.cookies["fb_dtsg"]}
467
- url = "https://www.meta.ai/api/graphql/"
468
-
469
- if not self.external_conversation_id:
470
- external_id = str(uuid.uuid4())
471
- self.external_conversation_id = external_id
472
- payload = {
473
- **auth_payload,
474
- "fb_api_caller_class": "RelayModern",
475
- "fb_api_req_friendly_name": "useAbraSendMessageMutation",
476
- "variables": json.dumps(
477
- {
478
- "message": {"sensitive_string_value": conversation_prompt},
479
- "externalConversationId": self.external_conversation_id,
480
- "offlineThreadingId": generate_offline_threading_id(),
481
- "suggestedPromptIndex": None,
482
- "flashVideoRecapInput": {"images": []},
483
- "flashPreviewInput": None,
484
- "promptPrefix": None,
485
- "entrypoint": "ABRA__CHAT__TEXT",
486
- "icebreaker_type": "TEXT",
487
- "__relay_internal__pv__AbraDebugDevOnlyrelayprovider": False,
488
- "__relay_internal__pv__WebPixelRatiorelayprovider": 1,
489
- }
490
- ),
491
- "server_timestamps": "true",
492
- "doc_id": "7783822248314888",
493
- }
494
- payload = urllib.parse.urlencode(payload) # noqa
495
- headers = {
496
- "content-type": "application/x-www-form-urlencoded",
497
- "x-fb-friendly-name": "useAbraSendMessageMutation",
498
- }
499
- if self.is_authed:
500
- headers["cookie"] = f'abra_sess={self.cookies["abra_sess"]}'
501
- # Recreate the session to avoid cookie leakage when user is authenticated
502
- self.session = requests.Session()
503
- self.session.proxies = self.proxy
504
-
505
- if stream:
506
-
507
- def for_stream():
508
- response = self.session.post(
509
- url, headers=headers, data=payload, stream=True, timeout=self.timeout
510
- )
511
- if not response.ok:
512
- raise exceptions.FailedToGenerateResponseError(
513
- f"Failed to generate response - ({response.status_code}, {response.reason}) - {response.text}"
514
- )
515
-
516
- lines = response.iter_lines()
517
- is_error = json.loads(next(lines))
518
- if len(is_error.get("errors", [])) > 0:
519
- raise exceptions.FailedToGenerateResponseError(
520
- f"Failed to generate response - {response.text}"
521
- )
522
- for line in lines:
523
- if line:
524
- json_line = json.loads(line)
525
- extracted_data = self.extract_data(json_line)
526
- if not extracted_data.get("message"):
527
- continue
528
- self.last_response.update(extracted_data)
529
- yield line if raw else extracted_data
530
- self.conversation.update_chat_history(
531
- prompt, self.get_message(self.last_response)
532
- )
533
-
534
- return for_stream()
535
- else:
536
- response = self.session.post(
537
- url, headers=headers, data=payload, timeout=self.timeout
538
- )
539
- if not response.ok:
540
- raise exceptions.FailedToGenerateResponseError(
541
- f"Failed to generate response - ({response.status_code}, {response.reason}) - {response.text}"
542
- )
543
- raw_response = response.text
544
- last_streamed_response = self.extract_last_response(raw_response)
545
- if not last_streamed_response:
546
- raise exceptions.FailedToGenerateResponseError(
547
- f"Failed to generate response - {response.text}"
548
- )
549
-
550
- extracted_data = self.extract_data(last_streamed_response)
551
- self.last_response.update(extracted_data)
552
- self.conversation.update_chat_history(
553
- prompt, self.get_message(self.last_response)
554
- )
555
- return extracted_data
556
-
557
- def chat(
558
- self,
559
- prompt: str,
560
- stream: bool = False,
561
- optimizer: str = None,
562
- conversationally: bool = False,
563
- ) -> str:
564
- """
565
- Sends a message to the Meta AI and returns the response.
566
-
567
- Args:
568
- prompt (str): The message to send.
569
- stream (bool): Whether to stream the response or not. Defaults to False.
570
- optimizer (str, optional): Prompt optimizer name - `[code, shell_command]`. Defaults to None.
571
- conversationally (bool, optional): Chat conversationally when using optimizer. Defaults to False.
572
-
573
- Returns:
574
- str: The response message.
575
- """
576
-
577
- def for_stream():
578
- for response in self.ask(
579
- prompt, True, optimizer=optimizer, conversationally=conversationally
580
- ):
581
- yield self.get_message(response)
582
-
583
- def for_non_stream():
584
- return self.get_message(
585
- self.ask(
586
- prompt,
587
- False,
588
- optimizer=optimizer,
589
- conversationally=conversationally,
590
- )
591
- )
592
-
593
- return for_stream() if stream else for_non_stream()
594
-
595
- def extract_last_response(self, response: str) -> Dict:
596
- """
597
- Extracts the last response from the Meta AI API.
598
-
599
- Args:
600
- response (str): The response to extract the last response from.
601
-
602
- Returns:
603
- dict: A dictionary containing the last response.
604
- """
605
- last_streamed_response = None
606
- for line in response.split("\n"):
607
- try:
608
- json_line = json.loads(line)
609
- except json.JSONDecodeError:
610
- continue
611
-
612
- bot_response_message = (
613
- json_line.get("data", {})
614
- .get("node", {})
615
- .get("bot_response_message", {})
616
- )
617
- chat_id = bot_response_message.get("id")
618
- if chat_id:
619
- external_conversation_id, offline_threading_id, _ = chat_id.split("_")
620
- self.external_conversation_id = external_conversation_id
621
- self.offline_threading_id = offline_threading_id
622
-
623
- streaming_state = bot_response_message.get("streaming_state")
624
- if streaming_state == "OVERALL_DONE":
625
- last_streamed_response = json_line
626
-
627
- return last_streamed_response
628
-
629
- def extract_data(self, json_line: dict) -> Dict:
630
- """
631
- Extract data and sources from a parsed JSON line.
632
-
633
- Args:
634
- json_line (dict): Parsed JSON line.
635
-
636
- Returns:
637
- dict: A dictionary containing the response message, sources, and media.
638
- """
639
- bot_response_message = (
640
- json_line.get("data", {}).get("node", {}).get("bot_response_message", {})
641
- )
642
- response = format_response(response=json_line)
643
- fetch_id = bot_response_message.get("fetch_id")
644
- sources = self.fetch_sources(fetch_id) if fetch_id else []
645
- medias = self.extract_media(bot_response_message)
646
- return {"message": response, "sources": sources, "media": medias}
647
-
648
- def extract_media(self, json_line: dict) -> List[Dict]:
649
- """
650
- Extract media from a parsed JSON line.
651
-
652
- Args:
653
- json_line (dict): Parsed JSON line.
654
-
655
- Returns:
656
- list: A list of dictionaries containing the extracted media.
657
- """
658
- medias = []
659
- imagine_card = json_line.get("imagine_card", {})
660
- session = imagine_card.get("session", {}) if imagine_card else {}
661
- media_sets = (
662
- (json_line.get("imagine_card", {}).get("session", {}).get("media_sets", []))
663
- if imagine_card and session
664
- else []
665
- )
666
- for media_set in media_sets:
667
- imagine_media = media_set.get("imagine_media", [])
668
- for media in imagine_media:
669
- medias.append(
670
- {
671
- "url": media.get("uri"),
672
- "type": media.get("media_type"),
673
- "prompt": media.get("prompt"),
674
- }
675
- )
676
- return medias
677
-
678
- def get_cookies(self) -> dict:
679
- """
680
- Extracts necessary cookies from the Meta AI main page.
681
-
682
- Returns:
683
- dict: A dictionary containing essential cookies.
684
- """
685
- session = HTMLSession()
686
- headers = {}
687
- if self.fb_email is not None and self.fb_password is not None:
688
- fb_session = get_fb_session(self.fb_email, self.fb_password, self.proxy)
689
- headers = {"cookie": f"abra_sess={fb_session['abra_sess']}"}
690
- response = session.get(
691
- "https://www.meta.ai/",
692
- headers=headers,
693
- proxies=self.proxy,
694
- )
695
- cookies = {
696
- "_js_datr": extract_value(
697
- response.text, start_str='_js_datr":{"value":"', end_str='",'
698
- ),
699
- "datr": extract_value(
700
- response.text, start_str='datr":{"value":"', end_str='",'
701
- ),
702
- "lsd": extract_value(
703
- response.text, start_str='"LSD",[],{"token":"', end_str='"}'
704
- ),
705
- "fb_dtsg": extract_value(
706
- response.text, start_str='DTSGInitData",[],{"token":"', end_str='"'
707
- ),
708
- }
709
-
710
- if len(headers) > 0:
711
- cookies["abra_sess"] = fb_session["abra_sess"]
712
- else:
713
- cookies["abra_csrf"] = extract_value(
714
- response.text, start_str='abra_csrf":{"value":"', end_str='",'
715
- )
716
- return cookies
717
-
718
def fetch_sources(self, fetch_id: str) -> List[Dict]:
    """
    Look up the search references attached to a Meta AI message.

    Args:
        fetch_id (str): Fetch ID of the message whose sources are requested.

    Returns:
        list: The ``references`` entries of the message's search results,
        or an empty list when the reply carries no message or no search
        results.
    """
    form = urllib.parse.urlencode(  # noqa
        {
            "access_token": self.access_token,
            "fb_api_caller_class": "RelayModern",
            "fb_api_req_friendly_name": "AbraSearchPluginDialogQuery",
            "variables": json.dumps({"abraMessageFetchID": fetch_id}),
            "server_timestamps": "true",
            "doc_id": "6946734308765963",
        }
    )
    request_headers = {
        "authority": "graph.meta.ai",
        "accept-language": "en-US,en;q=0.9,fr-FR;q=0.8,fr;q=0.7",
        "content-type": "application/x-www-form-urlencoded",
        "cookie": f'dpr=2; abra_csrf={self.cookies.get("abra_csrf")}; datr={self.cookies.get("datr")}; ps_n=1; ps_l=1',
        "x-fb-friendly-name": "AbraSearchPluginDialogQuery",
    }

    reply = self.session.post(
        "https://graph.meta.ai/graphql?locale=user",
        headers=request_headers,
        data=form,
    )
    message = reply.json().get("data", {}).get("message", {})
    if not message:
        return []

    search_results = message.get("searchResults")
    if search_results is None:
        return []
    return search_results["references"]
762
-
763
def get_message(self, response: dict) -> str:
    """Return only the message text of a response.

    Args:
        response (dict): Response generated by `self.ask`

    Returns:
        str: The value stored under the ``"message"`` key.
    """
    assert isinstance(response, dict), "Response should be of dict data-type only"
    message = response["message"]
    return message
774
-
775
if __name__ == "__main__":
    # Bind the instance to its own name; `Meta = Meta()` would replace the
    # class with the instance for the rest of the module.
    meta = Meta()
    ai = meta.chat("hi")
    for chunk in ai:
        print(chunk, end="", flush=True)
1
+ import json
2
+ import logging
3
+ import time
4
+ import urllib
5
+ import uuid
6
+ from typing import Dict, Generator, Iterator, List, Union
7
+
8
+ import random
9
+ import requests
10
+ from webscout.scout import Scout
11
+
12
+ from webscout.AIutel import Optimizers
13
+ from webscout.AIutel import Conversation
14
+ from webscout.AIutel import AwesomePrompts, sanitize_stream
15
+ from webscout.AIbase import Provider
16
+ from webscout import exceptions
17
+
18
+ MAX_RETRIES = 3
19
+
20
def generate_offline_threading_id() -> str:
    """
    Build an offline threading ID from the clock and a random value.

    The current time in milliseconds is shifted left by 22 bits, the low
    22 bits of a random 64-bit integer are OR-ed in, and the result is
    truncated to 64 bits.

    Returns:
        str: The threading ID as a decimal string.
    """
    low_22_bits = 0x3FFFFF
    uint64_mask = 0xFFFFFFFFFFFFFFFF

    millis = int(time.time() * 1000)
    entropy = random.getrandbits(64)

    return str(((millis << 22) | (entropy & low_22_bits)) & uint64_mask)
50
+
51
+
52
def extract_value(text: str, start_str: str, end_str: str) -> str:
    """
    Extract the substring located between two marker strings.

    Args:
        text (str): The text from which to extract the value.
        start_str (str): Marker that immediately precedes the value.
        end_str (str): Marker that immediately follows the value; it is
            searched for only after the end of ``start_str``.

    Returns:
        str: The text between the first ``start_str`` and the next
        ``end_str``, or an empty string when either marker is missing.
    """
    start = text.find(start_str)
    if start == -1:
        # str.find() signals "not found" with -1; using that as an index
        # would silently return an unrelated slice of the text.
        return ""
    start += len(start_str)

    end = text.find(end_str, start)
    if end == -1:
        return ""
    return text[start:end]
67
+
68
+
69
def format_response(response: dict) -> str:
    """
    Join the text fragments of a Meta AI reply into a single string.

    The fragments are read from
    ``data.node.bot_response_message.composed_text.content``. Any level of
    that path may be absent or ``None``; in that case there is nothing to
    join and an empty string is returned.

    Args:
        response (dict): The dictionary containing the response to format.

    Returns:
        str: Every fragment's ``"text"`` followed by a newline, concatenated
        in order.
    """
    composed_text = response
    for key in ("data", "node", "bot_response_message", "composed_text"):
        # `or {}` also covers keys that are present but hold JSON null.
        composed_text = composed_text.get(key) or {}

    fragments = composed_text.get("content") or []
    return "".join(fragment["text"] + "\n" for fragment in fragments)
89
+
90
+
91
+ # Function to perform the login
92
def get_fb_session(email, password, proxies=None):
    """
    Log in to Facebook and exchange the login for a Meta AI session.

    The flow is: load the mbasic login form, submit the credentials, request
    a ``state`` value from meta.ai, start the OIDC redirect on facebook.com
    and follow it back to meta.ai.

    Args:
        email (str): Facebook account email.
        password (str): Facebook account password.
        proxies (dict, optional): Proxy mapping passed to ``requests``.
            Defaults to None.

    Returns:
        dict: Cookies held by the final session, including ``abra_sess``.

    Raises:
        exceptions.FacebookInvalidCredentialsException: If the login does not
            yield the expected Facebook cookies, or the final session has no
            ``abra_sess`` cookie.
    """
    chrome_user_agent = "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/122.0.0.0 Safari/537.36"
    html_accept = "text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.7"
    login_failed_message = (
        "Was not able to login to Facebook. Please check your credentials. "
        "You may also have been rate limited. Try to connect to Facebook manually."
    )

    # Step 1: fetch the login form to obtain its hidden fields and cookies.
    login_url = "https://mbasic.facebook.com/login/"
    headers = {
        "authority": "mbasic.facebook.com",
        "accept": html_accept,
        "accept-language": "en-US,en;q=0.9",
        "sec-ch-ua": '"Chromium";v="122", "Not(A:Brand";v="24", "Google Chrome";v="122"',
        "sec-ch-ua-mobile": "?0",
        "sec-ch-ua-platform": '"macOS"',
        "sec-fetch-dest": "document",
        "sec-fetch-mode": "navigate",
        "sec-fetch-site": "none",
        "sec-fetch-user": "?1",
        "upgrade-insecure-requests": "1",
        "user-agent": chrome_user_agent,
    }
    response = requests.get(login_url, headers=headers, proxies=proxies)

    # Use Scout for parsing instead of BeautifulSoup
    scout = Scout(response.text)

    # Parse necessary parameters from the login form
    lsd = scout.find_first('input[name="lsd"]').get('value')
    jazoest = scout.find_first('input[name="jazoest"]').get('value')
    li = scout.find_first('input[name="li"]').get('value')
    m_ts = scout.find_first('input[name="m_ts"]').get('value')

    # Step 2: submit the login form.
    post_url = "https://mbasic.facebook.com/login/device-based/regular/login/?refsrc=deprecated&lwv=100"
    data = {
        "lsd": lsd,
        "jazoest": jazoest,
        "m_ts": m_ts,
        "li": li,
        "try_number": "0",
        "unrecognized_tries": "0",
        "email": email,
        "pass": password,
        "login": "Log In",
        "bi_xrwh": "0",
    }
    headers = {
        "authority": "mbasic.facebook.com",
        "accept": html_accept,
        "accept-language": "en-US,en;q=0.9",
        "cache-control": "no-cache",
        "content-type": "application/x-www-form-urlencoded",
        "cookie": f"datr={response.cookies.get('datr')}; sb={response.cookies.get('sb')}; ps_n=1; ps_l=1",
        "dpr": "2",
        "origin": "https://mbasic.facebook.com",
        "pragma": "no-cache",
        "referer": "https://mbasic.facebook.com/login/",
        "sec-fetch-site": "same-origin",
        "sec-fetch-user": "?1",
        "upgrade-insecure-requests": "1",
        "user-agent": chrome_user_agent,
        "viewport-width": "1728",
    }

    session = requests.session()
    session.proxies = proxies
    result = session.post(post_url, headers=headers, data=data)

    # Every cookie indexed below must exist. Checking them all up front makes
    # a failed login surface as the credentials exception rather than a bare
    # KeyError on "xs", "fr" or "c_user".
    required_cookies = ("sb", "xs", "fr", "c_user")
    if any(name not in session.cookies for name in required_cookies):
        raise exceptions.FacebookInvalidCredentialsException(login_failed_message)

    login_cookies = {
        **result.cookies.get_dict(),
        **{name: session.cookies[name] for name in required_cookies},
    }

    # Step 3: anonymous meta.ai values; "_js_datr", "datr", "lsd" and
    # "abra_csrf" are read from this mapping below.
    meta_ai_cookies = get_cookies()

    url = "https://www.meta.ai/state/"
    payload = f'__a=1&lsd={meta_ai_cookies["lsd"]}'
    headers = {
        "authority": "www.meta.ai",
        "accept": "*/*",
        "accept-language": "en-US,en;q=0.9",
        "cache-control": "no-cache",
        "content-type": "application/x-www-form-urlencoded",
        "cookie": f'ps_n=1; ps_l=1; dpr=2; _js_datr={meta_ai_cookies["_js_datr"]}; abra_csrf={meta_ai_cookies["abra_csrf"]}; datr={meta_ai_cookies["datr"]};; ps_l=1; ps_n=1',
        "origin": "https://www.meta.ai",
        "pragma": "no-cache",
        "referer": "https://www.meta.ai/",
        "sec-fetch-mode": "cors",
        "sec-fetch-site": "same-origin",
        "user-agent": chrome_user_agent,
    }
    response = requests.request("POST", url, headers=headers, data=payload, proxies=proxies)
    state = extract_value(response.text, start_str='"state":"', end_str='"')

    # Step 4: start the OIDC hand-off on facebook.com without following the
    # redirect, so the target URL can be requested with different headers.
    # NOTE(review): "datr" and "m_page_voice" are taken from the login
    # response's own cookies and are indexed directly; confirm they are
    # always set on a successful login.
    url = f"https://www.facebook.com/oidc/?app_id=1358015658191005&scope=openid%20linking&response_type=code&redirect_uri=https%3A%2F%2Fwww.meta.ai%2Fauth%2F&no_universal_links=1&deoia=1&state={state}"
    headers = {
        "authority": "www.facebook.com",
        "accept": html_accept,
        "accept-language": "en-US,en;q=0.9",
        "cache-control": "no-cache",
        "cookie": f"datr={login_cookies['datr']}; sb={login_cookies['sb']}; c_user={login_cookies['c_user']}; xs={login_cookies['xs']}; fr={login_cookies['fr']}; m_page_voice={login_cookies['m_page_voice']}; abra_csrf={meta_ai_cookies['abra_csrf']};",
        "sec-fetch-dest": "document",
        "sec-fetch-mode": "navigate",
        "sec-fetch-site": "cross-site",
        "sec-fetch-user": "?1",
        "upgrade-insecure-requests": "1",
        "user-agent": chrome_user_agent,
    }
    session = requests.session()
    session.proxies = proxies
    response = session.get(url, headers=headers, allow_redirects=False)
    next_url = response.headers["Location"]

    # Step 5: follow the redirect so the session receives the meta.ai cookies.
    headers = {
        "User-Agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10.15; rv:125.0) Gecko/20100101 Firefox/125.0",
        "Accept": "text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,*/*;q=0.8",
        "Accept-Language": "en-US,en;q=0.5",
        "Accept-Encoding": "gzip, deflate, br",
        "Referer": "https://www.meta.ai/",
        "Connection": "keep-alive",
        "Cookie": f'dpr=2; abra_csrf={meta_ai_cookies["abra_csrf"]}; datr={meta_ai_cookies["_js_datr"]}',
        "Upgrade-Insecure-Requests": "1",
        "Sec-Fetch-Dest": "document",
        "Sec-Fetch-Mode": "navigate",
        "Sec-Fetch-Site": "cross-site",
        "Sec-Fetch-User": "?1",
        "TE": "trailers",
    }
    session.get(next_url, headers=headers)

    cookies = session.cookies.get_dict()
    if "abra_sess" not in cookies:
        raise exceptions.FacebookInvalidCredentialsException(login_failed_message)
    logging.info("Successfully logged in to Facebook.")
    return cookies
249
+
250
+
251
def get_cookies(proxies: dict = None) -> dict:
    """
    Extract the anonymous cookies from the Meta AI main page.

    This is a module-level function, so it has no instance to read
    credentials or proxy settings from; it always performs an
    unauthenticated request.

    Args:
        proxies (dict, optional): Proxy mapping passed to ``requests``.
            Defaults to None.

    Returns:
        dict: ``_js_datr``, ``datr``, ``lsd``, ``fb_dtsg`` and ``abra_csrf``
        values extracted from the page source.
    """
    page = requests.get("https://www.meta.ai/", proxies=proxies).text

    # (start marker, end marker) pairs delimiting each value in the page source.
    markers = {
        "_js_datr": ('_js_datr":{"value":"', '",'),
        "datr": ('datr":{"value":"', '",'),
        "lsd": ('"LSD",[],{"token":"', '"}'),
        "fb_dtsg": ('DTSGInitData",[],{"token":"', '"'),
        "abra_csrf": ('abra_csrf":{"value":"', '",'),
    }
    return {
        name: extract_value(page, start_str=begin, end_str=finish)
        for name, (begin, finish) in markers.items()
    }
291
+
292
+ class Meta(Provider):
293
+ """
294
+ A class to interact with the Meta AI API to obtain and use access tokens for sending
295
+ and receiving messages from the Meta AI Chat API.
296
+ """
297
+
298
def __init__(
    self,
    fb_email: str = None,
    fb_password: str = None,
    proxy: dict = None,
    is_conversation: bool = True,
    max_tokens: int = 600,
    timeout: int = 30,
    intro: str = None,
    filepath: str = None,
    update_file: bool = True,
    proxies: dict = None,
    history_offset: int = 10250,
    act: str = None,
):
    """
    Initializes the Meta AI API with given parameters.

    Args:
        fb_email (str, optional): Your Facebook email address. Defaults to None.
        fb_password (str, optional): Your Facebook password. Defaults to None.
        proxy (dict, optional): Proxy settings for requests. Defaults to None.
        is_conversation (bool, optional): Flag for chatting conversationally. Defaults to True.
        max_tokens (int, optional): Maximum number of tokens to be generated upon completion. Defaults to 600.
        timeout (int, optional): Http request timeout. Defaults to 30.
        intro (str, optional): Conversation introductory prompt. Defaults to None.
        filepath (str, optional): Path to file containing conversation history. Defaults to None.
        update_file (bool, optional): Add new prompts and responses to the file. Defaults to True.
        proxies (dict, optional): Http request proxies; takes precedence over
            ``proxy`` for the session when both are given. Defaults to None
            (no extra proxies).
        history_offset (int, optional): Limit conversation history to this number of last texts. Defaults to 10250.
        act (str|int, optional): Awesome prompt key or index. (Used as intro). Defaults to None.

    Raises:
        ConnectionError: If ``proxy`` is given but the proxy check fails.
    """
    self.session = requests.Session()
    self.session.headers.update(
        {
            "user-agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 "
            "(KHTML, like Gecko) Chrome/122.0.0.0 Safari/537.36",
        }
    )
    self.access_token = None
    self.fb_email = fb_email
    self.fb_password = fb_password
    self.proxy = proxy
    if self.proxy and not self.check_proxy():
        raise ConnectionError(
            "Unable to connect to proxy. Please check your proxy settings."
        )
    self.is_conversation = is_conversation
    self.max_tokens_to_sample = max_tokens
    self.timeout = timeout
    self.last_response = {}
    self.is_authed = fb_password is not None and fb_email is not None
    self.cookies = self.get_cookies()
    self.external_conversation_id = None
    self.offline_threading_id = None

    # Materialise the names: a generator would be consumed by the first
    # membership test, so later optimizer lookups would wrongly fail.
    self.__available_optimizers = tuple(
        method
        for method in dir(Optimizers)
        if callable(getattr(Optimizers, method)) and not method.startswith("__")
    )
    Conversation.intro = (
        AwesomePrompts().get_act(
            act, raise_not_found=True, default=None, case_insensitive=True
        )
        if act
        else intro or Conversation.intro
    )
    self.conversation = Conversation(
        is_conversation, self.max_tokens_to_sample, filepath, update_file
    )
    self.conversation.history_offset = history_offset
    # Explicit `proxies` win; otherwise keep the verified `proxy` instead of
    # overwriting it with an empty mapping.
    self.session.proxies = proxies or self.proxy or {}
371
+
372
def check_proxy(self, test_url: str = "https://api.ipify.org/?format=json") -> bool:
    """
    Verify that the configured proxy can reach a test URL.

    On success the proxy is also installed on the instance's session.

    Args:
        test_url (str): URL requested through the proxy to verify it works.

    Returns:
        bool: True if the request returned HTTP 200, False on any other
        status or on a ``requests`` error.
    """
    try:
        reply = self.session.get(test_url, proxies=self.proxy, timeout=10)
    except requests.RequestException:
        return False

    if reply.status_code != 200:
        return False

    self.session.proxies = self.proxy
    return True
390
+
391
def get_access_token(self) -> str:
    """
    Retrieves an access token using Meta's authentication API.

    A token already stored on the instance is returned as-is. Otherwise a
    temporary-user token is requested by posting the terms-of-service
    mutation with the anonymous cookies.

    Returns:
        str: A valid access token.

    Raises:
        exceptions.FacebookRegionBlocked: If the reply is not valid JSON.
    """

    if self.access_token:
        return self.access_token

    url = "https://www.meta.ai/api/graphql/"
    payload = {
        "lsd": self.cookies["lsd"],
        "fb_api_caller_class": "RelayModern",
        "fb_api_req_friendly_name": "useAbraAcceptTOSForTempUserMutation",
        # NOTE(review): unlike the other requests in this class, this dict is
        # not passed through json.dumps() before url-encoding - confirm the
        # endpoint accepts it in this form.
        "variables": {
            "dob": "1999-01-01",
            "icebreaker_type": "TEXT",
            "__relay_internal__pv__WebPixelRatiorelayprovider": 1,
        },
        "doc_id": "7604648749596940",
    }
    payload = urllib.parse.urlencode(payload)  # noqa
    headers = {
        "content-type": "application/x-www-form-urlencoded",
        "cookie": f'_js_datr={self.cookies["_js_datr"]}; '
        f'abra_csrf={self.cookies["abra_csrf"]}; datr={self.cookies["datr"]};',
        "sec-fetch-site": "same-origin",
        "x-fb-friendly-name": "useAbraAcceptTOSForTempUserMutation",
    }

    # Apply the same timeout as the message requests so a stalled
    # connection cannot block forever.
    response = self.session.post(
        url, headers=headers, data=payload, timeout=self.timeout
    )

    try:
        auth_json = response.json()
    except ValueError as err:
        # ValueError is the common base of the JSON decode errors that
        # response.json() can raise, whichever JSON backend requests uses.
        raise exceptions.FacebookRegionBlocked(
            "Unable to receive a valid response from Meta AI. This is likely due to your region being blocked. "
            "Try manually accessing https://www.meta.ai/ to confirm."
        ) from err

    access_token = auth_json["data"]["xab_abra_accept_terms_of_service"][
        "new_temp_user_auth"
    ]["access_token"]

    # Need to sleep for a bit, for some reason the API doesn't like it when we send request too quickly
    # (maybe Meta needs to register Cookies on their side?)
    time.sleep(1)

    return access_token
442
+
443
def ask(
    self,
    prompt: str,
    stream: bool = False,
    raw: bool = False,
    optimizer: str = None,
    conversationally: bool = False,
) -> Union[Dict, Generator[Dict, None, None]]:
    """
    Sends a message to the Meta AI and returns the response.

    Args:
        prompt (str): The prompt to send.
        stream (bool): Whether to stream the response or not. Defaults to False.
        raw (bool, optional): Stream back raw response as received. Defaults to False.
        optimizer (str, optional): Prompt optimizer name - `[code, shell_command]`. Defaults to None.
        conversationally (bool, optional): Chat conversationally when using optimizer. Defaults to False.

    Returns:
        Union[Dict, Generator[Dict, None, None]]: A dictionary containing the response message and sources, or a generator yielding such dictionaries.

    Raises:
        Exception: If ``optimizer`` is not a known optimizer name.
        exceptions.FailedToGenerateResponseError: If the HTTP request fails,
            the reply is empty or reports errors, or no final response is found.
    """
    conversation_prompt = self.conversation.gen_complete_prompt(prompt)
    if optimizer:
        if optimizer in self.__available_optimizers:
            conversation_prompt = getattr(Optimizers, optimizer)(
                conversation_prompt if conversationally else prompt
            )
        else:
            raise Exception(
                f"Optimizer is not one of {self.__available_optimizers}"
            )

    # Anonymous use authenticates with a temporary access token against the
    # graph endpoint; logged-in use sends the fb_dtsg token to meta.ai.
    if not self.is_authed:
        self.access_token = self.get_access_token()
        auth_payload = {"access_token": self.access_token}
        url = "https://graph.meta.ai/graphql?locale=user"

    else:
        auth_payload = {"fb_dtsg": self.cookies["fb_dtsg"]}
        url = "https://www.meta.ai/api/graphql/"

    if not self.external_conversation_id:
        external_id = str(uuid.uuid4())
        self.external_conversation_id = external_id
    payload = {
        **auth_payload,
        "fb_api_caller_class": "RelayModern",
        "fb_api_req_friendly_name": "useAbraSendMessageMutation",
        "variables": json.dumps(
            {
                "message": {"sensitive_string_value": conversation_prompt},
                "externalConversationId": self.external_conversation_id,
                "offlineThreadingId": generate_offline_threading_id(),
                "suggestedPromptIndex": None,
                "flashVideoRecapInput": {"images": []},
                "flashPreviewInput": None,
                "promptPrefix": None,
                "entrypoint": "ABRA__CHAT__TEXT",
                "icebreaker_type": "TEXT",
                "__relay_internal__pv__AbraDebugDevOnlyrelayprovider": False,
                "__relay_internal__pv__WebPixelRatiorelayprovider": 1,
            }
        ),
        "server_timestamps": "true",
        "doc_id": "7783822248314888",
    }
    payload = urllib.parse.urlencode(payload)  # noqa
    headers = {
        "content-type": "application/x-www-form-urlencoded",
        "x-fb-friendly-name": "useAbraSendMessageMutation",
    }
    if self.is_authed:
        headers["cookie"] = f'abra_sess={self.cookies["abra_sess"]}'
        # Recreate the session to avoid cookie leakage when user is authenticated
        self.session = requests.Session()
        self.session.proxies = self.proxy

    if stream:

        def for_stream():
            response = self.session.post(
                url, headers=headers, data=payload, stream=True, timeout=self.timeout
            )
            if not response.ok:
                raise exceptions.FailedToGenerateResponseError(
                    f"Failed to generate response - ({response.status_code}, {response.reason}) - {response.text}"
                )

            lines = response.iter_lines()
            # A bare next() on an empty body would raise StopIteration, which
            # inside a generator becomes an opaque RuntimeError.
            first_line = next(lines, None)
            if first_line is None:
                raise exceptions.FailedToGenerateResponseError(
                    "Failed to generate response - empty response body"
                )
            # The first line is inspected for errors only; it is not yielded.
            is_error = json.loads(first_line)
            if len(is_error.get("errors", [])) > 0:
                # Report the parsed line: the body is already partly consumed
                # by iter_lines(), so response.text no longer holds it.
                raise exceptions.FailedToGenerateResponseError(
                    f"Failed to generate response - {is_error}"
                )
            for line in lines:
                if line:
                    json_line = json.loads(line)
                    extracted_data = self.extract_data(json_line)
                    if not extracted_data.get("message"):
                        continue
                    self.last_response.update(extracted_data)
                    yield line if raw else extracted_data
            self.conversation.update_chat_history(
                prompt, self.get_message(self.last_response)
            )

        return for_stream()
    else:
        response = self.session.post(
            url, headers=headers, data=payload, timeout=self.timeout
        )
        if not response.ok:
            raise exceptions.FailedToGenerateResponseError(
                f"Failed to generate response - ({response.status_code}, {response.reason}) - {response.text}"
            )
        raw_response = response.text
        last_streamed_response = self.extract_last_response(raw_response)
        if not last_streamed_response:
            raise exceptions.FailedToGenerateResponseError(
                f"Failed to generate response - {response.text}"
            )

        extracted_data = self.extract_data(last_streamed_response)
        self.last_response.update(extracted_data)
        self.conversation.update_chat_history(
            prompt, self.get_message(self.last_response)
        )
        return extracted_data
570
+
571
def chat(
    self,
    prompt: str,
    stream: bool = False,
    optimizer: str = None,
    conversationally: bool = False,
) -> str:
    """
    Send a message to Meta AI and return only the message text.

    Args:
        prompt (str): The message to send.
        stream (bool): Whether to stream the response or not. Defaults to False.
        optimizer (str, optional): Prompt optimizer name - `[code, shell_command]`. Defaults to None.
        conversationally (bool, optional): Chat conversationally when using optimizer. Defaults to False.

    Returns:
        str: The response message; when ``stream`` is true, a generator
        yielding the message text of each streamed response instead.
    """
    ask_options = {"optimizer": optimizer, "conversationally": conversationally}

    def stream_messages():
        # self.ask() is only invoked once the caller starts iterating.
        for chunk in self.ask(prompt, True, **ask_options):
            yield self.get_message(chunk)

    if stream:
        return stream_messages()
    return self.get_message(self.ask(prompt, False, **ask_options))
608
+
609
def extract_last_response(self, response: str) -> Dict:
    """
    Find the final streamed payload in a newline-delimited response body.

    Lines that are not valid JSON are skipped. Whenever a line carries a
    bot message ``id``, its first two ``_``-separated parts are stored on
    the instance as the external conversation ID and offline threading ID.

    Args:
        response (str): The full response body, one JSON document per line.

    Returns:
        dict: The last parsed line whose ``streaming_state`` is
        ``"OVERALL_DONE"``, or None if there is none.
    """
    final_payload = None
    for raw_line in response.split("\n"):
        try:
            parsed = json.loads(raw_line)
        except json.JSONDecodeError:
            continue

        bot_message = (
            parsed.get("data", {}).get("node", {}).get("bot_response_message", {})
        )

        message_id = bot_message.get("id")
        if message_id:
            conversation_part, threading_part, _ = message_id.split("_")
            self.external_conversation_id = conversation_part
            self.offline_threading_id = threading_part

        if bot_message.get("streaming_state") == "OVERALL_DONE":
            final_payload = parsed

    return final_payload
642
+
643
def extract_data(self, json_line: dict) -> Dict:
    """
    Build the message/sources/media summary for one parsed JSON line.

    Args:
        json_line (dict): Parsed JSON line.

    Returns:
        dict: ``"message"`` (formatted text), ``"sources"`` (fetched only
        when the bot message has a ``fetch_id``, else an empty list) and
        ``"media"`` (media extracted from the bot message).
    """
    bot_message = (
        json_line.get("data", {}).get("node", {}).get("bot_response_message", {})
    )
    message_text = format_response(response=json_line)

    fetch_id = bot_message.get("fetch_id")
    if fetch_id:
        sources = self.fetch_sources(fetch_id)
    else:
        sources = []

    return {
        "message": message_text,
        "sources": sources,
        "media": self.extract_media(bot_message),
    }
661
+
662
def extract_media(self, json_line: dict) -> List[Dict]:
    """
    Extract media from a parsed JSON line.

    Media entries are read from ``imagine_card.session.media_sets[*].imagine_media``.
    Any level of that path may be absent or ``None``, in which case it
    contributes no media.

    Args:
        json_line (dict): Parsed JSON object that may hold an ``imagine_card``.

    Returns:
        list: One dictionary per media entry with the keys ``"url"``,
        ``"type"`` and ``"prompt"``.
    """
    # `or {}` / `or []` also cover keys that are present but hold JSON null.
    imagine_card = json_line.get("imagine_card") or {}
    session = imagine_card.get("session") or {}

    medias = []
    for media_set in session.get("media_sets") or []:
        for media in media_set.get("imagine_media") or []:
            medias.append(
                {
                    "url": media.get("uri"),
                    "type": media.get("media_type"),
                    "prompt": media.get("prompt"),
                }
            )
    return medias
691
+
692
def get_cookies(self) -> dict:
    """
    Collect the cookie and token values embedded in the Meta AI landing page.

    When both Facebook credentials are set on the instance, a Facebook
    session is created first and its ``abra_sess`` cookie is sent with the
    page request and copied into the result. Otherwise the anonymous
    ``abra_csrf`` value is extracted from the page instead.

    Returns:
        dict: ``_js_datr``, ``datr``, ``lsd`` and ``fb_dtsg`` plus either
        ``abra_sess`` (credentials given) or ``abra_csrf`` (anonymous).
    """
    logged_in = self.fb_email is not None and self.fb_password is not None

    request_headers = {}
    if logged_in:
        fb_session = get_fb_session(self.fb_email, self.fb_password, self.proxy)
        request_headers = {"cookie": f"abra_sess={fb_session['abra_sess']}"}

    page = requests.get(
        "https://www.meta.ai/",
        headers=request_headers,
        proxies=self.proxy,
    ).text

    # (start marker, end marker) pairs delimiting each value in the page source.
    markers = {
        "_js_datr": ('_js_datr":{"value":"', '",'),
        "datr": ('datr":{"value":"', '",'),
        "lsd": ('"LSD",[],{"token":"', '"}'),
        "fb_dtsg": ('DTSGInitData",[],{"token":"', '"'),
    }
    cookies = {
        name: extract_value(page, start_str=begin, end_str=finish)
        for name, (begin, finish) in markers.items()
    }

    if logged_in:
        cookies["abra_sess"] = fb_session["abra_sess"]
    else:
        cookies["abra_csrf"] = extract_value(
            page, start_str='abra_csrf":{"value":"', end_str='",'
        )
    return cookies
732
+
733
def fetch_sources(self, fetch_id: str) -> List[Dict]:
    """
    Look up the search references attached to a Meta AI message.

    Args:
        fetch_id (str): Fetch ID of the message whose sources are requested.

    Returns:
        list: The ``references`` entries of the message's search results,
        or an empty list when the reply carries no message or no search
        results.
    """
    form = urllib.parse.urlencode(  # noqa
        {
            "access_token": self.access_token,
            "fb_api_caller_class": "RelayModern",
            "fb_api_req_friendly_name": "AbraSearchPluginDialogQuery",
            "variables": json.dumps({"abraMessageFetchID": fetch_id}),
            "server_timestamps": "true",
            "doc_id": "6946734308765963",
        }
    )
    request_headers = {
        "authority": "graph.meta.ai",
        "accept-language": "en-US,en;q=0.9,fr-FR;q=0.8,fr;q=0.7",
        "content-type": "application/x-www-form-urlencoded",
        "cookie": f'dpr=2; abra_csrf={self.cookies.get("abra_csrf")}; datr={self.cookies.get("datr")}; ps_n=1; ps_l=1',
        "x-fb-friendly-name": "AbraSearchPluginDialogQuery",
    }

    reply = self.session.post(
        "https://graph.meta.ai/graphql?locale=user",
        headers=request_headers,
        data=form,
    )
    message = reply.json().get("data", {}).get("message", {})
    if not message:
        return []

    search_results = message.get("searchResults")
    if search_results is None:
        return []
    return search_results["references"]
777
+
778
def get_message(self, response: dict) -> str:
    """Return only the message text of a response.

    Args:
        response (dict): Response generated by `self.ask`

    Returns:
        str: The value stored under the ``"message"`` key.
    """
    assert isinstance(response, dict), "Response should be of dict data-type only"
    message = response["message"]
    return message
789
+
790
if __name__ == "__main__":
    # Bind the instance to its own name; `Meta = Meta()` would replace the
    # class with the instance for the rest of the module.
    meta = Meta()
    ai = meta.chat("hi")
    for chunk in ai:
        print(chunk, end="", flush=True)