webscout 7.0__py3-none-any.whl → 7.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of webscout might be problematic. Click here for more details.

Files changed (147) hide show
  1. webscout/AIauto.py +191 -191
  2. webscout/AIbase.py +122 -122
  3. webscout/AIutel.py +440 -440
  4. webscout/Bard.py +343 -161
  5. webscout/DWEBS.py +489 -492
  6. webscout/Extra/YTToolkit/YTdownloader.py +995 -995
  7. webscout/Extra/YTToolkit/__init__.py +2 -2
  8. webscout/Extra/YTToolkit/transcriber.py +476 -479
  9. webscout/Extra/YTToolkit/ytapi/channel.py +307 -307
  10. webscout/Extra/YTToolkit/ytapi/playlist.py +58 -58
  11. webscout/Extra/YTToolkit/ytapi/pool.py +7 -7
  12. webscout/Extra/YTToolkit/ytapi/utils.py +62 -62
  13. webscout/Extra/YTToolkit/ytapi/video.py +103 -103
  14. webscout/Extra/autocoder/__init__.py +9 -9
  15. webscout/Extra/autocoder/autocoder_utiles.py +199 -199
  16. webscout/Extra/autocoder/rawdog.py +5 -7
  17. webscout/Extra/autollama.py +230 -230
  18. webscout/Extra/gguf.py +3 -3
  19. webscout/Extra/weather.py +171 -171
  20. webscout/LLM.py +442 -442
  21. webscout/Litlogger/__init__.py +67 -681
  22. webscout/Litlogger/core/__init__.py +6 -0
  23. webscout/Litlogger/core/level.py +20 -0
  24. webscout/Litlogger/core/logger.py +123 -0
  25. webscout/Litlogger/handlers/__init__.py +12 -0
  26. webscout/Litlogger/handlers/console.py +50 -0
  27. webscout/Litlogger/handlers/file.py +143 -0
  28. webscout/Litlogger/handlers/network.py +174 -0
  29. webscout/Litlogger/styles/__init__.py +7 -0
  30. webscout/Litlogger/styles/colors.py +231 -0
  31. webscout/Litlogger/styles/formats.py +377 -0
  32. webscout/Litlogger/styles/text.py +87 -0
  33. webscout/Litlogger/utils/__init__.py +6 -0
  34. webscout/Litlogger/utils/detectors.py +154 -0
  35. webscout/Litlogger/utils/formatters.py +200 -0
  36. webscout/Provider/AISEARCH/DeepFind.py +250 -250
  37. webscout/Provider/Blackboxai.py +136 -137
  38. webscout/Provider/ChatGPTGratis.py +226 -0
  39. webscout/Provider/Cloudflare.py +91 -78
  40. webscout/Provider/DeepSeek.py +218 -0
  41. webscout/Provider/Deepinfra.py +59 -35
  42. webscout/Provider/Free2GPT.py +131 -124
  43. webscout/Provider/Gemini.py +100 -115
  44. webscout/Provider/Glider.py +74 -59
  45. webscout/Provider/Groq.py +30 -18
  46. webscout/Provider/Jadve.py +108 -77
  47. webscout/Provider/Llama3.py +117 -94
  48. webscout/Provider/Marcus.py +191 -137
  49. webscout/Provider/Netwrck.py +62 -50
  50. webscout/Provider/PI.py +79 -124
  51. webscout/Provider/PizzaGPT.py +129 -83
  52. webscout/Provider/QwenLM.py +311 -0
  53. webscout/Provider/TTI/AiForce/__init__.py +22 -22
  54. webscout/Provider/TTI/AiForce/async_aiforce.py +257 -257
  55. webscout/Provider/TTI/AiForce/sync_aiforce.py +242 -242
  56. webscout/Provider/TTI/Nexra/__init__.py +22 -22
  57. webscout/Provider/TTI/Nexra/async_nexra.py +286 -286
  58. webscout/Provider/TTI/Nexra/sync_nexra.py +258 -258
  59. webscout/Provider/TTI/PollinationsAI/__init__.py +23 -23
  60. webscout/Provider/TTI/PollinationsAI/async_pollinations.py +330 -330
  61. webscout/Provider/TTI/PollinationsAI/sync_pollinations.py +285 -285
  62. webscout/Provider/TTI/artbit/__init__.py +22 -22
  63. webscout/Provider/TTI/artbit/async_artbit.py +184 -184
  64. webscout/Provider/TTI/artbit/sync_artbit.py +176 -176
  65. webscout/Provider/TTI/blackbox/__init__.py +4 -4
  66. webscout/Provider/TTI/blackbox/async_blackbox.py +212 -212
  67. webscout/Provider/TTI/blackbox/sync_blackbox.py +199 -199
  68. webscout/Provider/TTI/deepinfra/__init__.py +4 -4
  69. webscout/Provider/TTI/deepinfra/async_deepinfra.py +227 -227
  70. webscout/Provider/TTI/deepinfra/sync_deepinfra.py +199 -199
  71. webscout/Provider/TTI/huggingface/__init__.py +22 -22
  72. webscout/Provider/TTI/huggingface/async_huggingface.py +199 -199
  73. webscout/Provider/TTI/huggingface/sync_huggingface.py +195 -195
  74. webscout/Provider/TTI/imgninza/__init__.py +4 -4
  75. webscout/Provider/TTI/imgninza/async_ninza.py +214 -214
  76. webscout/Provider/TTI/imgninza/sync_ninza.py +209 -209
  77. webscout/Provider/TTI/talkai/__init__.py +4 -4
  78. webscout/Provider/TTI/talkai/async_talkai.py +229 -229
  79. webscout/Provider/TTI/talkai/sync_talkai.py +207 -207
  80. webscout/Provider/TTS/deepgram.py +182 -182
  81. webscout/Provider/TTS/elevenlabs.py +136 -136
  82. webscout/Provider/TTS/gesserit.py +150 -150
  83. webscout/Provider/TTS/murfai.py +138 -138
  84. webscout/Provider/TTS/parler.py +133 -134
  85. webscout/Provider/TTS/streamElements.py +360 -360
  86. webscout/Provider/TTS/utils.py +280 -280
  87. webscout/Provider/TTS/voicepod.py +116 -116
  88. webscout/Provider/TextPollinationsAI.py +74 -47
  89. webscout/Provider/WiseCat.py +193 -0
  90. webscout/Provider/__init__.py +144 -136
  91. webscout/Provider/cerebras.py +242 -227
  92. webscout/Provider/chatglm.py +204 -204
  93. webscout/Provider/dgaf.py +67 -39
  94. webscout/Provider/gaurish.py +105 -66
  95. webscout/Provider/geminiapi.py +208 -208
  96. webscout/Provider/granite.py +223 -0
  97. webscout/Provider/hermes.py +218 -218
  98. webscout/Provider/llama3mitril.py +179 -179
  99. webscout/Provider/llamatutor.py +72 -62
  100. webscout/Provider/llmchat.py +60 -35
  101. webscout/Provider/meta.py +794 -794
  102. webscout/Provider/multichat.py +331 -230
  103. webscout/Provider/typegpt.py +359 -356
  104. webscout/Provider/yep.py +5 -5
  105. webscout/__main__.py +5 -5
  106. webscout/cli.py +319 -319
  107. webscout/conversation.py +241 -242
  108. webscout/exceptions.py +328 -328
  109. webscout/litagent/__init__.py +28 -28
  110. webscout/litagent/agent.py +2 -3
  111. webscout/litprinter/__init__.py +0 -58
  112. webscout/scout/__init__.py +8 -8
  113. webscout/scout/core.py +884 -884
  114. webscout/scout/element.py +459 -459
  115. webscout/scout/parsers/__init__.py +69 -69
  116. webscout/scout/parsers/html5lib_parser.py +172 -172
  117. webscout/scout/parsers/html_parser.py +236 -236
  118. webscout/scout/parsers/lxml_parser.py +178 -178
  119. webscout/scout/utils.py +38 -38
  120. webscout/swiftcli/__init__.py +811 -811
  121. webscout/update_checker.py +2 -12
  122. webscout/version.py +1 -1
  123. webscout/webscout_search.py +1142 -1140
  124. webscout/webscout_search_async.py +635 -635
  125. webscout/zeroart/__init__.py +54 -54
  126. webscout/zeroart/base.py +60 -60
  127. webscout/zeroart/effects.py +99 -99
  128. webscout/zeroart/fonts.py +816 -816
  129. {webscout-7.0.dist-info → webscout-7.2.dist-info}/METADATA +21 -28
  130. webscout-7.2.dist-info/RECORD +217 -0
  131. webstoken/__init__.py +30 -30
  132. webstoken/classifier.py +189 -189
  133. webstoken/keywords.py +216 -216
  134. webstoken/language.py +128 -128
  135. webstoken/ner.py +164 -164
  136. webstoken/normalizer.py +35 -35
  137. webstoken/processor.py +77 -77
  138. webstoken/sentiment.py +206 -206
  139. webstoken/stemmer.py +73 -73
  140. webstoken/tagger.py +60 -60
  141. webstoken/tokenizer.py +158 -158
  142. webscout/Provider/RUBIKSAI.py +0 -272
  143. webscout-7.0.dist-info/RECORD +0 -199
  144. {webscout-7.0.dist-info → webscout-7.2.dist-info}/LICENSE.md +0 -0
  145. {webscout-7.0.dist-info → webscout-7.2.dist-info}/WHEEL +0 -0
  146. {webscout-7.0.dist-info → webscout-7.2.dist-info}/entry_points.txt +0 -0
  147. {webscout-7.0.dist-info → webscout-7.2.dist-info}/top_level.txt +0 -0
webscout/Provider/meta.py CHANGED
@@ -1,794 +1,794 @@
1
- import json
2
- import logging
3
- import time
4
- import urllib
5
- import uuid
6
- from typing import Dict, Generator, Iterator, List, Union
7
-
8
- import random
9
- import requests
10
- from webscout.scout import Scout
11
-
12
- from webscout.AIutel import Optimizers
13
- from webscout.AIutel import Conversation
14
- from webscout.AIutel import AwesomePrompts, sanitize_stream
15
- from webscout.AIbase import Provider
16
- from webscout import exceptions
17
- from webscout import LitAgent as Lit
18
- MAX_RETRIES = 3
19
-
20
def generate_offline_threading_id() -> str:
    """
    Build an "offline threading" identifier for an outgoing message.

    The current Unix time in milliseconds is shifted left by 22 bits, the low
    22 bits of a random 64-bit integer are OR-ed in, and the result is
    truncated to 64 bits.

    Returns:
        str: The identifier rendered as a decimal string.
    """
    uint64_mask = (1 << 64) - 1
    low22_mask = (1 << 22) - 1

    millis = int(time.time() * 1000)
    entropy = random.getrandbits(64)

    # Timestamp fills the upper bits; only 22 bits of randomness are kept.
    packed = ((millis << 22) | (entropy & low22_mask)) & uint64_mask
    return str(packed)
50
-
51
-
52
def extract_value(text: str, start_str: str, end_str: str) -> str:
    """
    Return the substring of ``text`` located between two markers.

    Args:
        text (str): The text from which to extract the value.
        start_str (str): Marker that immediately precedes the value.
        end_str (str): Marker that immediately follows the value; it is
            searched for only after the end of ``start_str``.

    Returns:
        str: The text between the first occurrence of ``start_str`` and the
        next occurrence of ``end_str``. An empty string is returned when
        either marker cannot be found.
    """
    start = text.find(start_str)
    if start == -1:
        # Without this guard, -1 + len(start_str) would yield an arbitrary
        # slice from the beginning of the text.
        return ""
    start += len(start_str)

    end = text.find(end_str, start)
    if end == -1:
        # A slice ending at -1 would silently drop the last character.
        return ""
    return text[start:end]
67
-
68
-
69
def format_response(response: dict) -> str:
    """
    Concatenate the text fragments of a Meta AI bot response.

    The fragments are read from
    ``response["data"]["node"]["bot_response_message"]["composed_text"]["content"]``.
    Any level of that path may be absent or ``None``; in that case the result
    is an empty string.

    Args:
        response (dict): The dictionary containing the response to format.

    Returns:
        str: Every fragment's ``"text"`` value, each followed by a newline.
    """
    # ``or {}`` (rather than a ``.get`` default) also covers keys that are
    # present but hold a JSON ``null``.
    message = (
        ((response.get("data") or {}).get("node") or {}).get("bot_response_message")
        or {}
    )
    fragments = (message.get("composed_text") or {}).get("content") or []
    return "".join(fragment["text"] + "\n" for fragment in fragments)
89
-
90
-
91
- # Function to perform the login
92
def get_fb_session(email, password, proxies=None):
    """
    Log in to Facebook and exchange the login for Meta AI session cookies.

    Steps, in order:
      1. GET the mbasic login page and read the hidden form fields.
      2. POST the credentials to the login endpoint.
      3. Fetch anonymous Meta AI cookies and request an OIDC ``state`` value.
      4. Follow the Facebook OIDC redirect back to meta.ai.

    Args:
        email: Facebook account e-mail.
        password: Facebook account password.
        proxies: Optional ``requests``-style proxy mapping used for every call.

    Returns:
        dict: Cookies held by the final session (includes ``abra_sess``).

    Raises:
        exceptions.FacebookInvalidCredentialsException: If the ``sb`` cookie is
            missing after the login POST, or ``abra_sess`` is missing after the
            OIDC redirect.
    """
    from types import SimpleNamespace

    browser_accept = "text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.7"
    chrome_user_agent = "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/122.0.0.0 Safari/537.36"
    login_failed_message = (
        "Was not able to login to Facebook. Please check your credentials. "
        "You may also have been rate limited. Try to connect to Facebook manually."
    )

    # --- 1. Load the login form -------------------------------------------
    login_url = "https://mbasic.facebook.com/login/"
    headers = {
        "authority": "mbasic.facebook.com",
        "accept": browser_accept,
        "accept-language": "en-US,en;q=0.9",
        "sec-ch-ua": '"Chromium";v="122", "Not(A:Brand";v="24", "Google Chrome";v="122"',
        "sec-ch-ua-mobile": "?0",
        "sec-ch-ua-platform": '"macOS"',
        "sec-fetch-dest": "document",
        "sec-fetch-mode": "navigate",
        "sec-fetch-site": "none",
        "sec-fetch-user": "?1",
        "upgrade-insecure-requests": "1",
        "user-agent": Lit().random(),
    }
    response = requests.get(login_url, headers=headers, proxies=proxies)

    # Hidden form inputs that must be echoed back with the credentials.
    scout = Scout(response.text)
    lsd = scout.find_first('input[name="lsd"]').get('value')
    jazoest = scout.find_first('input[name="jazoest"]').get('value')
    li = scout.find_first('input[name="li"]').get('value')
    m_ts = scout.find_first('input[name="m_ts"]').get('value')

    # --- 2. Submit the credentials ----------------------------------------
    post_url = "https://mbasic.facebook.com/login/device-based/regular/login/?refsrc=deprecated&lwv=100"
    data = {
        "lsd": lsd,
        "jazoest": jazoest,
        "m_ts": m_ts,
        "li": li,
        "try_number": "0",
        "unrecognized_tries": "0",
        "email": email,
        "pass": password,
        "login": "Log In",
        "bi_xrwh": "0",
    }
    headers = {
        "authority": "mbasic.facebook.com",
        "accept": browser_accept,
        "accept-language": "en-US,en;q=0.9",
        "cache-control": "no-cache",
        "content-type": "application/x-www-form-urlencoded",
        "cookie": f"datr={response.cookies.get('datr')}; sb={response.cookies.get('sb')}; ps_n=1; ps_l=1",
        "dpr": "2",
        "origin": "https://mbasic.facebook.com",
        "pragma": "no-cache",
        "referer": "https://mbasic.facebook.com/login/",
        "sec-fetch-site": "same-origin",
        "sec-fetch-user": "?1",
        "upgrade-insecure-requests": "1",
        "user-agent": chrome_user_agent,
        "viewport-width": "1728",
    }

    session = requests.session()
    session.proxies = proxies
    result = session.post(post_url, headers=headers, data=data)
    if "sb" not in session.cookies:
        raise exceptions.FacebookInvalidCredentialsException(login_failed_message)

    login_cookies = {
        **result.cookies.get_dict(),
        "sb": session.cookies["sb"],
        "xs": session.cookies["xs"],
        "fr": session.cookies["fr"],
        "c_user": session.cookies["c_user"],
    }

    # --- 3. Anonymous Meta AI cookies + OIDC state ------------------------
    # The module-level get_cookies() reads fb_email / fb_password / proxy from
    # its argument; passing a credential-less stub requests the anonymous
    # cookie set (which carries abra_csrf) and avoids calling it with no
    # argument, which raised TypeError.
    meta_ai_cookies = get_cookies(
        SimpleNamespace(fb_email=None, fb_password=None, proxy=proxies)
    )

    url = "https://www.meta.ai/state/"
    payload = f'__a=1&lsd={meta_ai_cookies["lsd"]}'
    headers = {
        "authority": "www.meta.ai",
        "accept": "*/*",
        "accept-language": "en-US,en;q=0.9",
        "cache-control": "no-cache",
        "content-type": "application/x-www-form-urlencoded",
        "cookie": f'ps_n=1; ps_l=1; dpr=2; _js_datr={meta_ai_cookies["_js_datr"]}; abra_csrf={meta_ai_cookies["abra_csrf"]}; datr={meta_ai_cookies["datr"]};; ps_l=1; ps_n=1',
        "origin": "https://www.meta.ai",
        "pragma": "no-cache",
        "referer": "https://www.meta.ai/",
        "sec-fetch-mode": "cors",
        "sec-fetch-site": "same-origin",
        "user-agent": chrome_user_agent,
    }
    response = requests.request("POST", url, headers=headers, data=payload, proxies=proxies)
    state = extract_value(response.text, start_str='"state":"', end_str='"')

    # --- 4. OIDC hand-off from facebook.com back to meta.ai ---------------
    url = f"https://www.facebook.com/oidc/?app_id=1358015658191005&scope=openid%20linking&response_type=code&redirect_uri=https%3A%2F%2Fwww.meta.ai%2Fauth%2F&no_universal_links=1&deoia=1&state={state}"
    headers = {
        "authority": "www.facebook.com",
        "accept": browser_accept,
        "accept-language": "en-US,en;q=0.9",
        "cache-control": "no-cache",
        "cookie": f"datr={login_cookies['datr']}; sb={login_cookies['sb']}; c_user={login_cookies['c_user']}; xs={login_cookies['xs']}; fr={login_cookies['fr']}; m_page_voice={login_cookies['m_page_voice']}; abra_csrf={meta_ai_cookies['abra_csrf']};",
        "sec-fetch-dest": "document",
        "sec-fetch-mode": "navigate",
        "sec-fetch-site": "cross-site",
        "sec-fetch-user": "?1",
        "upgrade-insecure-requests": "1",
        "user-agent": chrome_user_agent,
    }
    # Fresh session so that only the cookies set during the hand-off are kept.
    session = requests.session()
    session.proxies = proxies
    # The redirect is followed manually below, with a different header set.
    response = session.get(url, headers=headers, allow_redirects=False)
    next_url = response.headers["Location"]

    headers = {
        "User-Agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10.15; rv:125.0) Gecko/20100101 Firefox/125.0",
        "Accept": "text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,*/*;q=0.8",
        "Accept-Language": "en-US,en;q=0.5",
        "Accept-Encoding": "gzip, deflate, br",
        "Referer": "https://www.meta.ai/",
        "Connection": "keep-alive",
        "Cookie": f'dpr=2; abra_csrf={meta_ai_cookies["abra_csrf"]}; datr={meta_ai_cookies["_js_datr"]}',
        "Upgrade-Insecure-Requests": "1",
        "Sec-Fetch-Dest": "document",
        "Sec-Fetch-Mode": "navigate",
        "Sec-Fetch-Site": "cross-site",
        "Sec-Fetch-User": "?1",
        "TE": "trailers",
    }
    session.get(next_url, headers=headers)

    cookies = session.cookies.get_dict()
    if "abra_sess" not in cookies:
        raise exceptions.FacebookInvalidCredentialsException(login_failed_message)
    logging.info("Successfully logged in to Facebook.")
    return cookies
249
-
250
-
251
def get_cookies(self=None) -> dict:
    """
    Extract the cookies and tokens embedded in the Meta AI main page.

    This is a module-level function, yet it was declared with a required
    ``self`` parameter while ``get_fb_session`` calls it with no arguments.
    ``self`` is therefore optional: when omitted (or when it carries no
    credentials) the page is fetched anonymously.

    Args:
        self: Optional object exposing ``fb_email``, ``fb_password`` and
            ``proxy`` attributes. Missing attributes are treated as ``None``.

    Returns:
        dict: ``_js_datr``, ``datr``, ``lsd`` and ``fb_dtsg`` values, plus
        ``abra_sess`` when a Facebook login was performed or ``abra_csrf``
        otherwise.
    """
    fb_email = getattr(self, "fb_email", None)
    fb_password = getattr(self, "fb_password", None)
    proxy = getattr(self, "proxy", None)

    headers = {}
    fb_session = None
    if fb_email is not None and fb_password is not None:
        fb_session = get_fb_session(fb_email, fb_password, proxy)
        headers = {"cookie": f"abra_sess={fb_session['abra_sess']}"}

    response = requests.get(
        "https://www.meta.ai/",
        headers=headers,
        proxies=proxy,
    )
    page = response.text

    # The values are scraped from JSON fragments inlined in the HTML.
    cookies = {
        "_js_datr": extract_value(
            page, start_str='_js_datr":{"value":"', end_str='",'
        ),
        "datr": extract_value(
            page, start_str='datr":{"value":"', end_str='",'
        ),
        "lsd": extract_value(
            page, start_str='"LSD",[],{"token":"', end_str='"}'
        ),
        "fb_dtsg": extract_value(
            page, start_str='DTSGInitData",[],{"token":"', end_str='"'
        ),
    }

    if fb_session is not None:
        cookies["abra_sess"] = fb_session["abra_sess"]
    else:
        cookies["abra_csrf"] = extract_value(
            page, start_str='abra_csrf":{"value":"', end_str='",'
        )
    return cookies
291
-
292
- class Meta(Provider):
293
- """
294
- A class to interact with the Meta AI API to obtain and use access tokens for sending
295
- and receiving messages from the Meta AI Chat API.
296
- """
297
-
298
def __init__(
    self,
    fb_email: str = None,
    fb_password: str = None,
    proxy: dict = None,
    is_conversation: bool = True,
    max_tokens: int = 600,
    timeout: int = 30,
    intro: str = None,
    filepath: str = None,
    update_file: bool = True,
    proxies: dict = None,
    history_offset: int = 10250,
    act: str = None,
):
    """
    Initializes the Meta AI API with given parameters.

    Args:
        fb_email (str, optional): Your Facebook email address. Defaults to None.
        fb_password (str, optional): Your Facebook password. Defaults to None.
        proxy (dict, optional): Proxy settings for requests. Defaults to None.
        is_conversation (bool, optional): Flag for chatting conversationally. Defaults to True.
        max_tokens (int, optional): Maximum number of tokens to be generated upon completion. Defaults to 600.
        timeout (int, optional): Http request timeout. Defaults to 30.
        intro (str, optional): Conversation introductory prompt. Defaults to None.
        filepath (str, optional): Path to file containing conversation history. Defaults to None.
        update_file (bool, optional): Add new prompts and responses to the file. Defaults to True.
        proxies (dict, optional): Http request proxies applied to the session.
            Defaults to None; when empty, the session keeps whatever ``proxy`` installed.
        history_offset (int, optional): Limit conversation history to this number of last texts. Defaults to 10250.
        act (str|int, optional): Awesome prompt key or index. (Used as intro). Defaults to None.

    Raises:
        ConnectionError: If ``proxy`` is given and the proxy check fails.
    """
    self.session = requests.Session()
    self.session.headers.update(
        {
            "user-agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 "
            "(KHTML, like Gecko) Chrome/122.0.0.0 Safari/537.36",
        }
    )
    self.access_token = None
    self.fb_email = fb_email
    self.fb_password = fb_password
    self.proxy = proxy
    if self.proxy and not self.check_proxy():
        raise ConnectionError(
            "Unable to connect to proxy. Please check your proxy settings."
        )
    self.is_conversation = is_conversation
    self.max_tokens_to_sample = max_tokens
    self.timeout = timeout
    self.last_response = {}
    self.is_authed = fb_password is not None and fb_email is not None
    self.cookies = self.get_cookies()
    self.external_conversation_id = None
    self.offline_threading_id = None

    # Stored as a tuple: a generator expression would be exhausted by the
    # first membership test and could not be checked again.
    self.__available_optimizers = tuple(
        method
        for method in dir(Optimizers)
        if callable(getattr(Optimizers, method)) and not method.startswith("__")
    )
    Conversation.intro = (
        AwesomePrompts().get_act(
            act, raise_not_found=True, default=None, case_insensitive=True
        )
        if act
        else intro or Conversation.intro
    )
    self.conversation = Conversation(
        is_conversation, self.max_tokens_to_sample, filepath, update_file
    )
    self.conversation.history_offset = history_offset
    # Only override the session proxies when some were actually supplied;
    # an unconditional assignment would discard the proxy that check_proxy()
    # installed above.
    if proxies:
        self.session.proxies = proxies
371
-
372
def check_proxy(self, test_url: str = "https://api.ipify.org/?format=json") -> bool:
    """
    Probe the configured proxy by requesting a test URL through it.

    On an HTTP 200 answer the proxy is also installed on ``self.session``.

    Args:
        test_url (str): URL fetched through ``self.proxy`` to validate it.

    Returns:
        bool: True if the request returned status 200, False on any other
        status or on a ``requests.RequestException``.
    """
    try:
        probe = self.session.get(test_url, proxies=self.proxy, timeout=10)
    except requests.RequestException:
        return False

    if probe.status_code != 200:
        return False

    self.session.proxies = self.proxy
    return True
390
-
391
def get_access_token(self) -> str:
    """
    Retrieves an access token using Meta's authentication API.

    A token already stored on ``self.access_token`` is returned as-is.
    Otherwise a temporary-user terms-of-service mutation is posted to the
    Meta AI GraphQL endpoint and the token is read from its JSON reply.
    This method does not store the token; the caller does.

    Returns:
        str: A valid access token.

    Raises:
        exceptions.FacebookRegionBlocked: If the reply is not valid JSON.
    """
    if self.access_token:
        return self.access_token

    url = "https://www.meta.ai/api/graphql/"
    # NOTE(review): "variables" is a nested dict, so urlencode serialises it
    # with str() rather than as JSON (ask() uses json.dumps) — confirm the
    # endpoint accepts this form before changing it.
    payload = urllib.parse.urlencode(  # noqa
        {
            "lsd": self.cookies["lsd"],
            "fb_api_caller_class": "RelayModern",
            "fb_api_req_friendly_name": "useAbraAcceptTOSForTempUserMutation",
            "variables": {
                "dob": "1999-01-01",
                "icebreaker_type": "TEXT",
                "__relay_internal__pv__WebPixelRatiorelayprovider": 1,
            },
            "doc_id": "7604648749596940",
        }
    )
    headers = {
        "content-type": "application/x-www-form-urlencoded",
        "cookie": f'_js_datr={self.cookies["_js_datr"]}; '
        f'abra_csrf={self.cookies["abra_csrf"]}; datr={self.cookies["datr"]};',
        "sec-fetch-site": "same-origin",
        "x-fb-friendly-name": "useAbraAcceptTOSForTempUserMutation",
    }

    # Bounded like the requests in ask(); without a timeout a stalled
    # connection would block indefinitely.
    response = self.session.post(
        url, headers=headers, data=payload, timeout=self.timeout
    )

    try:
        auth_json = response.json()
    except ValueError as err:
        # ValueError is the common base of json.JSONDecodeError and of the
        # decode error requests raises when simplejson is installed.
        raise exceptions.FacebookRegionBlocked(
            "Unable to receive a valid response from Meta AI. This is likely due to your region being blocked. "
            "Try manually accessing https://www.meta.ai/ to confirm."
        ) from err

    access_token = auth_json["data"]["xab_abra_accept_terms_of_service"][
        "new_temp_user_auth"
    ]["access_token"]

    # Need to sleep for a bit, for some reason the API doesn't like it when we send request too quickly
    # (maybe Meta needs to register Cookies on their side?)
    time.sleep(1)

    return access_token
442
-
443
def ask(
    self,
    prompt: str,
    stream: bool = False,
    raw: bool = False,
    optimizer: str = None,
    conversationally: bool = False,
) -> Union[Dict, Generator[Dict, None, None]]:
    """
    Sends a message to the Meta AI and returns the response.

    Args:
        prompt (str): The prompt to send.
        stream (bool): Whether to stream the response or not. Defaults to False.
        raw (bool, optional): Stream back raw response as received. Defaults to False.
        optimizer (str, optional): Prompt optimizer name - `[code, shell_command]`. Defaults to None.
        conversationally (bool, optional): Chat conversationally when using optimizer. Defaults to False.

    Returns:
        Union[Dict, Generator[Dict, None, None]]: A dictionary containing the response message and sources, or a generator yielding such dictionaries.

    Raises:
        Exception: If ``optimizer`` is not a public callable of ``Optimizers``.
        exceptions.FailedToGenerateResponseError: On a non-OK HTTP status, an
            empty or error-carrying stream, or a reply without a final message.
    """
    conversation_prompt = self.conversation.gen_complete_prompt(prompt)
    if optimizer:
        # Resolved here on every call so the check never depends on a
        # previously consumed iterator.
        available_optimizers = tuple(
            name
            for name in dir(Optimizers)
            if callable(getattr(Optimizers, name)) and not name.startswith("__")
        )
        if optimizer not in available_optimizers:
            raise Exception(
                f"Optimizer is not one of {available_optimizers}"
            )
        conversation_prompt = getattr(Optimizers, optimizer)(
            conversation_prompt if conversationally else prompt
        )

    # Anonymous users authenticate with a temporary access token against the
    # graph endpoint; logged-in users send fb_dtsg to the web endpoint.
    if not self.is_authed:
        self.access_token = self.get_access_token()
        auth_payload = {"access_token": self.access_token}
        url = "https://graph.meta.ai/graphql?locale=user"
    else:
        auth_payload = {"fb_dtsg": self.cookies["fb_dtsg"]}
        url = "https://www.meta.ai/api/graphql/"

    if not self.external_conversation_id:
        self.external_conversation_id = str(uuid.uuid4())

    payload = urllib.parse.urlencode(  # noqa
        {
            **auth_payload,
            "fb_api_caller_class": "RelayModern",
            "fb_api_req_friendly_name": "useAbraSendMessageMutation",
            "variables": json.dumps(
                {
                    "message": {"sensitive_string_value": conversation_prompt},
                    "externalConversationId": self.external_conversation_id,
                    "offlineThreadingId": generate_offline_threading_id(),
                    "suggestedPromptIndex": None,
                    "flashVideoRecapInput": {"images": []},
                    "flashPreviewInput": None,
                    "promptPrefix": None,
                    "entrypoint": "ABRA__CHAT__TEXT",
                    "icebreaker_type": "TEXT",
                    "__relay_internal__pv__AbraDebugDevOnlyrelayprovider": False,
                    "__relay_internal__pv__WebPixelRatiorelayprovider": 1,
                }
            ),
            "server_timestamps": "true",
            "doc_id": "7783822248314888",
        }
    )
    headers = {
        "content-type": "application/x-www-form-urlencoded",
        "x-fb-friendly-name": "useAbraSendMessageMutation",
    }
    if self.is_authed:
        headers["cookie"] = f'abra_sess={self.cookies["abra_sess"]}'
        # Recreate the session to avoid cookie leakage when user is authenticated
        self.session = requests.Session()
        self.session.proxies = self.proxy

    def for_stream():
        response = self.session.post(
            url, headers=headers, data=payload, stream=True, timeout=self.timeout
        )
        if not response.ok:
            raise exceptions.FailedToGenerateResponseError(
                f"Failed to generate response - ({response.status_code}, {response.reason}) - {response.text}"
            )

        lines = response.iter_lines()
        # A bare next() on an empty body would raise StopIteration inside
        # this generator, which Python turns into RuntimeError (PEP 479).
        first_line = next(lines, None)
        if first_line is None:
            raise exceptions.FailedToGenerateResponseError(
                "Failed to generate response - empty response body"
            )
        # The first line is only inspected for errors; it is not yielded.
        is_error = json.loads(first_line)
        if len(is_error.get("errors", [])) > 0:
            raise exceptions.FailedToGenerateResponseError(
                f"Failed to generate response - {response.text}"
            )
        for line in lines:
            if not line:
                continue
            extracted_data = self.extract_data(json.loads(line))
            if not extracted_data.get("message"):
                continue
            self.last_response.update(extracted_data)
            yield line if raw else extracted_data
        self.conversation.update_chat_history(
            prompt, self.get_message(self.last_response)
        )

    if stream:
        return for_stream()

    response = self.session.post(
        url, headers=headers, data=payload, timeout=self.timeout
    )
    if not response.ok:
        raise exceptions.FailedToGenerateResponseError(
            f"Failed to generate response - ({response.status_code}, {response.reason}) - {response.text}"
        )
    last_streamed_response = self.extract_last_response(response.text)
    if not last_streamed_response:
        raise exceptions.FailedToGenerateResponseError(
            f"Failed to generate response - {response.text}"
        )

    extracted_data = self.extract_data(last_streamed_response)
    self.last_response.update(extracted_data)
    self.conversation.update_chat_history(
        prompt, self.get_message(self.last_response)
    )
    return extracted_data
570
-
571
def chat(
    self,
    prompt: str,
    stream: bool = False,
    optimizer: str = None,
    conversationally: bool = False,
) -> str:
    """
    Send a message to Meta AI and return only the reply text.

    Args:
        prompt (str): The message to send.
        stream (bool): Whether to stream the response or not. Defaults to False.
        optimizer (str, optional): Prompt optimizer name - `[code, shell_command]`. Defaults to None.
        conversationally (bool, optional): Chat conversationally when using optimizer. Defaults to False.

    Returns:
        str: The response message, or a generator of messages when
        ``stream`` is true.
    """
    if not stream:
        reply = self.ask(
            prompt,
            False,
            optimizer=optimizer,
            conversationally=conversationally,
        )
        return self.get_message(reply)

    def _stream_messages():
        # ask() is invoked lazily, on first iteration of this generator.
        for chunk in self.ask(
            prompt, True, optimizer=optimizer, conversationally=conversationally
        ):
            yield self.get_message(chunk)

    return _stream_messages()
608
-
609
def extract_last_response(self, response: str) -> Dict:
    """
    Extracts the last response from the Meta AI API.

    The body is scanned line by line as JSON. Whenever a line carries a bot
    message ``id`` of the form ``<conversation>_<threading>_...``, the first
    two parts are stored on ``self.external_conversation_id`` and
    ``self.offline_threading_id``.

    Args:
        response (str): The response to extract the last response from.

    Returns:
        dict: The last parsed line whose ``streaming_state`` is
        ``"OVERALL_DONE"``, or None if there is none.
    """
    last_streamed_response = None
    for line in response.split("\n"):
        try:
            json_line = json.loads(line)
        except json.JSONDecodeError:
            continue
        if not isinstance(json_line, dict):
            # Valid JSON that is not an object (e.g. "[]") carries no message.
            continue

        # ``or {}`` also covers keys present with a JSON ``null`` value.
        bot_response_message = (
            ((json_line.get("data") or {}).get("node") or {}).get(
                "bot_response_message"
            )
            or {}
        )

        chat_id = bot_response_message.get("id")
        if chat_id:
            id_parts = chat_id.split("_")
            # Ids without the expected separators are skipped instead of
            # raising on a strict three-way unpack.
            if len(id_parts) >= 2:
                self.external_conversation_id = id_parts[0]
                self.offline_threading_id = id_parts[1]

        if bot_response_message.get("streaming_state") == "OVERALL_DONE":
            last_streamed_response = json_line

    return last_streamed_response
642
-
643
def extract_data(self, json_line: dict) -> Dict:
    """
    Build the response payload from one parsed JSON line.

    Args:
        json_line (dict): Parsed JSON line.

    Returns:
        dict: ``"message"`` (formatted text), ``"sources"`` (fetched only when
        the bot message has a ``fetch_id``, otherwise an empty list) and
        ``"media"`` (extracted from the bot message).
    """
    data = json_line.get("data", {})
    node = data.get("node", {})
    bot_message = node.get("bot_response_message", {})

    message_text = format_response(response=json_line)

    fetch_id = bot_message.get("fetch_id")
    if fetch_id:
        sources = self.fetch_sources(fetch_id)
    else:
        sources = []

    return {
        "message": message_text,
        "sources": sources,
        "media": self.extract_media(bot_message),
    }
661
-
662
def extract_media(self, json_line: dict) -> List[Dict]:
    """
    Collect the media entries found under ``imagine_card.session.media_sets``.

    Args:
        json_line (dict): Bot response message dictionary.

    Returns:
        list: One ``{"url", "type", "prompt"}`` dictionary per media item;
        empty when the card or its session is missing or empty.
    """
    card = json_line.get("imagine_card", {})
    session = card.get("session", {}) if card else {}
    if not (card and session):
        return []
    return [
        {
            "url": item.get("uri"),
            "type": item.get("media_type"),
            "prompt": item.get("prompt"),
        }
        for media_set in session.get("media_sets", [])
        for item in media_set.get("imagine_media", [])
    ]
691
-
692
def get_cookies(self) -> dict:
    """
    Scrape the tokens embedded in the Meta AI landing page.

    When both ``self.fb_email`` and ``self.fb_password`` are set, a Facebook
    session is obtained first and its ``abra_sess`` cookie is sent with the
    request and included in the result; otherwise the anonymous ``abra_csrf``
    token is scraped instead.

    Returns:
        dict: ``_js_datr``, ``datr``, ``lsd`` and ``fb_dtsg`` plus either
        ``abra_sess`` (authenticated) or ``abra_csrf`` (anonymous).
    """
    headers = {}
    fb_session = None
    if self.fb_email is not None and self.fb_password is not None:
        fb_session = get_fb_session(self.fb_email, self.fb_password, self.proxy)
        headers = {"cookie": f"abra_sess={fb_session['abra_sess']}"}

    # Without a timeout requests waits indefinitely on an unresponsive host.
    response = requests.get(
        "https://www.meta.ai/",
        headers=headers,
        proxies=self.proxy,
        timeout=getattr(self, "timeout", 30),
    )
    page = response.text

    cookies = {
        "_js_datr": extract_value(
            page, start_str='_js_datr":{"value":"', end_str='",'
        ),
        "datr": extract_value(page, start_str='datr":{"value":"', end_str='",'),
        "lsd": extract_value(page, start_str='"LSD",[],{"token":"', end_str='"}'),
        "fb_dtsg": extract_value(
            page, start_str='DTSGInitData",[],{"token":"', end_str='"'
        ),
    }

    if fb_session is not None:
        cookies["abra_sess"] = fb_session["abra_sess"]
    else:
        cookies["abra_csrf"] = extract_value(
            page, start_str='abra_csrf":{"value":"', end_str='",'
        )
    return cookies
732
-
733
def fetch_sources(self, fetch_id: str) -> List[Dict]:
    """
    Fetch the search references attached to a message.

    Args:
        fetch_id (str): The fetch ID to use for the query.

    Returns:
        list: The ``references`` list from the response's ``searchResults``,
        or an empty list when any level of that path is missing or null.
    """
    url = "https://graph.meta.ai/graphql?locale=user"
    payload = urllib.parse.urlencode(  # noqa
        {
            "access_token": self.access_token,
            "fb_api_caller_class": "RelayModern",
            "fb_api_req_friendly_name": "AbraSearchPluginDialogQuery",
            "variables": json.dumps({"abraMessageFetchID": fetch_id}),
            "server_timestamps": "true",
            "doc_id": "6946734308765963",
        }
    )

    headers = {
        "authority": "graph.meta.ai",
        "accept-language": "en-US,en;q=0.9,fr-FR;q=0.8,fr;q=0.7",
        "content-type": "application/x-www-form-urlencoded",
        "cookie": f'dpr=2; abra_csrf={self.cookies.get("abra_csrf")}; datr={self.cookies.get("datr")}; ps_n=1; ps_l=1',
        "x-fb-friendly-name": "AbraSearchPluginDialogQuery",
    }

    # Bound the wait so a stalled sources lookup cannot hang the caller.
    response = self.session.post(
        url, headers=headers, data=payload, timeout=getattr(self, "timeout", 30)
    )
    response_json = response.json()

    # `or {}` / `or []` cover both absent keys and explicit nulls, so a
    # response without references yields [] instead of raising KeyError.
    message = (response_json.get("data") or {}).get("message") or {}
    search_results = message.get("searchResults") or {}
    return search_results.get("references") or []
777
-
778
def get_message(self, response: dict) -> str:
    """Return the ``"message"`` entry of a response dictionary.

    Args:
        response (dict): Response generated by `self.ask`

    Returns:
        str: Message extracted
    """
    is_mapping = isinstance(response, dict)
    assert is_mapping, "Response should be of dict data-type only"
    message = response["message"]
    return message
789
-
790
if __name__ == "__main__":
    # Use a distinct name for the instance: rebinding `Meta` would shadow the
    # class and make it impossible to create a second client afterwards.
    meta_ai = Meta()
    reply = meta_ai.chat("hi")
    # chat() is called without stream=True, so this iterates whatever it
    # returned piece by piece and prints it without added newlines.
    for chunk in reply:
        print(chunk, end="", flush=True)
1
+ import json
2
+ import logging
3
+ import time
4
+ import urllib
5
+ import uuid
6
+ from typing import Dict, Generator, Iterator, List, Union
7
+
8
+ import random
9
+ import requests
10
+ from webscout.scout import Scout
11
+
12
+ from webscout.AIutel import Optimizers
13
+ from webscout.AIutel import Conversation
14
+ from webscout.AIutel import AwesomePrompts, sanitize_stream
15
+ from webscout.AIbase import Provider
16
+ from webscout import exceptions
17
+ from webscout import LitAgent as Lit
18
+ MAX_RETRIES = 3
19
+
20
def generate_offline_threading_id() -> str:
    """
    Build an offline threading ID from the clock and a random value.

    The current time in milliseconds is shifted left by 22 bits, the low
    22 bits are filled from a random 64-bit integer, and the result is
    truncated to 64 bits.

    Returns:
        str: The ID as a decimal string.
    """
    low_22_bits = (1 << 22) - 1
    uint64_mask = (1 << 64) - 1

    millis = int(time.time() * 1000)
    noise = random.getrandbits(64)

    combined = ((millis << 22) | (noise & low_22_bits)) & uint64_mask
    return str(combined)
50
+
51
+
52
def extract_value(text: str, start_str: str, end_str: str) -> str:
    """
    Return the substring of ``text`` enclosed by two markers.

    Args:
        text (str): The text from which to extract the value.
        start_str (str): Marker that immediately precedes the value.
        end_str (str): Marker that immediately follows the value; it is
            searched for only after ``start_str``.

    Returns:
        str: The text between the first ``start_str`` and the next
        ``end_str``, or an empty string when either marker is absent.
    """
    marker_pos = text.find(start_str)
    if marker_pos == -1:
        # str.find returns -1 on a miss; adding len(start_str) to that would
        # slice from an arbitrary offset and return unrelated text.
        return ""
    start = marker_pos + len(start_str)

    end = text.find(end_str, start)
    if end == -1:
        # An unterminated value would otherwise be sliced as text[start:-1].
        return ""
    return text[start:end]
67
+
68
+
69
def format_response(response: dict) -> str:
    """
    Join the text fragments of a Meta AI response into one string.

    Args:
        response (dict): The dictionary containing the response to format.

    Returns:
        str: Every ``text`` entry found under
        ``data.node.bot_response_message.composed_text.content``, each
        followed by a newline; empty when that path is missing.
    """
    bot_message = (
        response.get("data", {}).get("node", {}).get("bot_response_message", {})
    )
    fragments = bot_message.get("composed_text", {}).get("content", [])
    return "".join(fragment["text"] + "\n" for fragment in fragments)
89
+
90
+
91
+ # Function to perform the login
92
def get_fb_session(email, password, proxies=None):
    """
    Log in to Facebook and exchange the login for a Meta AI session.

    Steps, in order: load the mbasic login form, submit the credentials,
    request an OIDC ``state`` from meta.ai, follow the Facebook OIDC redirect
    back to meta.ai, and return the cookies collected by that final session.

    Args:
        email (str): Facebook account e-mail.
        password (str): Facebook account password.
        proxies (dict, optional): Proxy mapping passed to every request.

    Returns:
        dict: Cookies of the final session; guaranteed to contain
        ``abra_sess``.

    Raises:
        exceptions.FacebookInvalidCredentialsException: If the login cookies,
            the OIDC redirect or the ``abra_sess`` cookie are missing.
    """
    login_failed_message = (
        "Was not able to login to Facebook. Please check your credentials. "
        "You may also have been rate limited. Try to connect to Facebook manually."
    )
    browser_accept = "text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.7"

    login_url = "https://mbasic.facebook.com/login/"
    headers = {
        "authority": "mbasic.facebook.com",
        "accept": browser_accept,
        "accept-language": "en-US,en;q=0.9",
        "sec-ch-ua": '"Chromium";v="122", "Not(A:Brand";v="24", "Google Chrome";v="122"',
        "sec-ch-ua-mobile": "?0",
        "sec-ch-ua-platform": '"macOS"',
        "sec-fetch-dest": "document",
        "sec-fetch-mode": "navigate",
        "sec-fetch-site": "none",
        "sec-fetch-user": "?1",
        "upgrade-insecure-requests": "1",
        "user-agent": Lit().random(),
    }
    # Fetch the login form to obtain its hidden anti-forgery fields.
    response = requests.get(login_url, headers=headers, proxies=proxies)

    # Use Scout for parsing instead of BeautifulSoup
    scout = Scout(response.text)
    lsd = scout.find_first('input[name="lsd"]').get('value')
    jazoest = scout.find_first('input[name="jazoest"]').get('value')
    li = scout.find_first('input[name="li"]').get('value')
    m_ts = scout.find_first('input[name="m_ts"]').get('value')

    # Submit the login form.
    post_url = "https://mbasic.facebook.com/login/device-based/regular/login/?refsrc=deprecated&lwv=100"
    data = {
        "lsd": lsd,
        "jazoest": jazoest,
        "m_ts": m_ts,
        "li": li,
        "try_number": "0",
        "unrecognized_tries": "0",
        "email": email,
        "pass": password,
        "login": "Log In",
        "bi_xrwh": "0",
    }
    headers = {
        "authority": "mbasic.facebook.com",
        "accept": browser_accept,
        "accept-language": "en-US,en;q=0.9",
        "cache-control": "no-cache",
        "content-type": "application/x-www-form-urlencoded",
        "cookie": f"datr={response.cookies.get('datr')}; sb={response.cookies.get('sb')}; ps_n=1; ps_l=1",
        "dpr": "2",
        "origin": "https://mbasic.facebook.com",
        "pragma": "no-cache",
        "referer": "https://mbasic.facebook.com/login/",
        "sec-fetch-site": "same-origin",
        "sec-fetch-user": "?1",
        "upgrade-insecure-requests": "1",
        "user-agent": Lit().random(),
        "viewport-width": "1728",
    }

    session = requests.session()
    session.proxies = proxies
    result = session.post(post_url, headers=headers, data=data)

    # Every cookie read below must exist; a partial login previously escaped
    # as a bare KeyError instead of the documented credentials exception.
    required = ("sb", "xs", "fr", "c_user")
    if any(name not in session.cookies for name in required):
        raise exceptions.FacebookInvalidCredentialsException(login_failed_message)

    login_cookies = {
        **result.cookies.get_dict(),
        **{name: session.cookies[name] for name in required},
    }

    # The module-level get_cookies() requires an instance argument, so calling
    # it bare raised TypeError; scrape the anonymous tokens directly instead.
    meta_ai_cookies = _fetch_anonymous_meta_cookies(proxies)

    url = "https://www.meta.ai/state/"
    payload = f'__a=1&lsd={meta_ai_cookies["lsd"]}'
    headers = {
        "authority": "www.meta.ai",
        "accept": "*/*",
        "accept-language": "en-US,en;q=0.9",
        "cache-control": "no-cache",
        "content-type": "application/x-www-form-urlencoded",
        "cookie": f'ps_n=1; ps_l=1; dpr=2; _js_datr={meta_ai_cookies["_js_datr"]}; abra_csrf={meta_ai_cookies["abra_csrf"]}; datr={meta_ai_cookies["datr"]};; ps_l=1; ps_n=1',
        "origin": "https://www.meta.ai",
        "pragma": "no-cache",
        "referer": "https://www.meta.ai/",
        "sec-fetch-mode": "cors",
        "sec-fetch-site": "same-origin",
        "user-agent": Lit().random(),
        "viewport-width": "1728",
    }
    response = requests.request("POST", url, headers=headers, data=payload, proxies=proxies)
    state = extract_value(response.text, start_str='"state":"', end_str='"')

    url = f"https://www.facebook.com/oidc/?app_id=1358015658191005&scope=openid%20linking&response_type=code&redirect_uri=https%3A%2F%2Fwww.meta.ai%2Fauth%2F&no_universal_links=1&deoia=1&state={state}"
    # Send only the cookies the login actually produced; indexing a missing
    # one (e.g. m_page_voice) used to abort the flow with KeyError.
    forwarded = ("datr", "sb", "c_user", "xs", "fr", "m_page_voice")
    cookie_pairs = [
        f"{name}={login_cookies[name]}" for name in forwarded if name in login_cookies
    ]
    cookie_pairs.append(f"abra_csrf={meta_ai_cookies['abra_csrf']};")
    headers = {
        "authority": "www.facebook.com",
        "accept": browser_accept,
        "accept-language": "en-US,en;q=0.9",
        "cache-control": "no-cache",
        "cookie": "; ".join(cookie_pairs),
        "sec-fetch-dest": "document",
        "sec-fetch-mode": "navigate",
        "sec-fetch-site": "cross-site",
        "sec-fetch-user": "?1",
        "upgrade-insecure-requests": "1",
        "user-agent": Lit().random(),
    }
    session = requests.session()
    session.proxies = proxies
    # Redirects are followed manually so the second hop can use its own headers.
    response = session.get(url, headers=headers, allow_redirects=False)

    next_url = response.headers.get("Location")
    if not next_url:
        raise exceptions.FacebookInvalidCredentialsException(login_failed_message)

    headers = {
        "User-Agent": Lit().random(),
        "Accept": "text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,*/*;q=0.8",
        "Accept-Language": "en-US,en;q=0.5",
        "Accept-Encoding": "gzip, deflate, br",
        "Referer": "https://www.meta.ai/",
        "Connection": "keep-alive",
        "Cookie": f'dpr=2; abra_csrf={meta_ai_cookies["abra_csrf"]}; datr={meta_ai_cookies["_js_datr"]}',
        "Upgrade-Insecure-Requests": "1",
        "Sec-Fetch-Dest": "document",
        "Sec-Fetch-Mode": "navigate",
        "Sec-Fetch-Site": "cross-site",
        "Sec-Fetch-User": "?1",
        "TE": "trailers",
    }
    session.get(next_url, headers=headers)

    cookies = session.cookies.get_dict()
    if "abra_sess" not in cookies:
        raise exceptions.FacebookInvalidCredentialsException(login_failed_message)
    logging.info("Successfully logged in to Facebook.")
    return cookies


def _fetch_anonymous_meta_cookies(proxies=None) -> dict:
    """Scrape the anonymous tokens embedded in the meta.ai landing page."""
    page = requests.get("https://www.meta.ai/", proxies=proxies).text
    return {
        "_js_datr": extract_value(
            page, start_str='_js_datr":{"value":"', end_str='",'
        ),
        "datr": extract_value(page, start_str='datr":{"value":"', end_str='",'),
        "lsd": extract_value(page, start_str='"LSD",[],{"token":"', end_str='"}'),
        "abra_csrf": extract_value(
            page, start_str='abra_csrf":{"value":"', end_str='",'
        ),
    }
250
+
251
+
252
def get_cookies(self=None) -> dict:
    """
    Scrape the tokens embedded in the Meta AI landing page.

    This is a module-level function, so it can be called without an
    argument; in that case no credentials and no proxy are used.

    Args:
        self (object, optional): Object whose ``fb_email``, ``fb_password``,
            ``proxy`` and ``timeout`` attributes are read when present.
            Defaults to None.

    Returns:
        dict: ``_js_datr``, ``datr``, ``lsd`` and ``fb_dtsg`` plus either
        ``abra_sess`` (when credentials were supplied) or ``abra_csrf``.
    """
    # `self` used to be mandatory, which made the bare `get_cookies()` call in
    # get_fb_session raise TypeError; read the settings defensively instead.
    fb_email = getattr(self, "fb_email", None)
    fb_password = getattr(self, "fb_password", None)
    proxy = getattr(self, "proxy", None)

    headers = {}
    fb_session = None
    if fb_email is not None and fb_password is not None:
        fb_session = get_fb_session(fb_email, fb_password, proxy)
        headers = {"cookie": f"abra_sess={fb_session['abra_sess']}"}

    response = requests.get(
        "https://www.meta.ai/",
        headers=headers,
        proxies=proxy,
        timeout=getattr(self, "timeout", None),
    )
    page = response.text

    cookies = {
        "_js_datr": extract_value(
            page, start_str='_js_datr":{"value":"', end_str='",'
        ),
        "datr": extract_value(page, start_str='datr":{"value":"', end_str='",'),
        "lsd": extract_value(page, start_str='"LSD",[],{"token":"', end_str='"}'),
        "fb_dtsg": extract_value(
            page, start_str='DTSGInitData",[],{"token":"', end_str='"'
        ),
    }

    if fb_session is not None:
        cookies["abra_sess"] = fb_session["abra_sess"]
    else:
        cookies["abra_csrf"] = extract_value(
            page, start_str='abra_csrf":{"value":"', end_str='",'
        )
    return cookies
292
+
293
class Meta(Provider):
    """
    Client for the Meta AI chat API.

    Without Facebook credentials it obtains a temporary access token and
    talks to ``graph.meta.ai``; with credentials it authenticates through
    ``get_fb_session`` and talks to ``www.meta.ai`` using the ``abra_sess``
    cookie.
    """

    def __init__(
        self,
        fb_email: str = None,
        fb_password: str = None,
        proxy: dict = None,
        is_conversation: bool = True,
        max_tokens: int = 600,
        timeout: int = 30,
        intro: str = None,
        filepath: str = None,
        update_file: bool = True,
        proxies: dict = None,
        history_offset: int = 10250,
        act: str = None,
    ):
        """
        Initializes the Meta AI API with given parameters.

        Args:
            fb_email (str, optional): Your Facebook email address. Defaults to None.
            fb_password (str, optional): Your Facebook password. Defaults to None.
            proxy (dict, optional): Proxy settings for requests. Defaults to None.
            is_conversation (bool, optional): Flag for chatting conversationally. Defaults to True.
            max_tokens (int, optional): Maximum number of tokens to be generated upon completion. Defaults to 600.
            timeout (int, optional): Http request timeout. Defaults to 30.
            intro (str, optional): Conversation introductory prompt. Defaults to None.
            filepath (str, optional): Path to file containing conversation history. Defaults to None.
            update_file (bool, optional): Add new prompts and responses to the file. Defaults to True.
            proxies (dict, optional): Http request proxies; when given they take
                precedence over ``proxy`` for the shared session. Defaults to None.
            history_offset (int, optional): Limit conversation history to this number of last texts. Defaults to 10250.
            act (str|int, optional): Awesome prompt key or index. (Used as intro). Defaults to None.

        Raises:
            ConnectionError: If ``proxy`` is given but the proxy check fails.
        """
        self.session = requests.Session()
        self.session.headers.update({"user-agent": Lit().random()})
        self.access_token = None
        self.fb_email = fb_email
        self.fb_password = fb_password
        self.proxy = proxy
        if self.proxy and not self.check_proxy():
            raise ConnectionError(
                "Unable to connect to proxy. Please check your proxy settings."
            )
        self.is_conversation = is_conversation
        self.max_tokens_to_sample = max_tokens
        self.timeout = timeout
        self.last_response = {}
        self.is_authed = fb_password is not None and fb_email is not None
        self.cookies = self.get_cookies()
        self.external_conversation_id = None
        self.offline_threading_id = None

        # Materialise the names: a generator would be consumed by the first
        # `in` test and every later optimizer lookup would then fail.
        self.__available_optimizers = tuple(
            method
            for method in dir(Optimizers)
            if callable(getattr(Optimizers, method)) and not method.startswith("__")
        )
        Conversation.intro = (
            AwesomePrompts().get_act(
                act, raise_not_found=True, default=None, case_insensitive=True
            )
            if act
            else intro or Conversation.intro
        )
        self.conversation = Conversation(
            is_conversation, self.max_tokens_to_sample, filepath, update_file
        )
        self.conversation.history_offset = history_offset
        # Only override the session proxies when some were actually supplied;
        # assigning the empty default here used to discard the proxy that
        # check_proxy() had just installed. The copy keeps the caller's dict
        # from being shared with the session.
        if proxies:
            self.session.proxies = dict(proxies)

    def check_proxy(self, test_url: str = "https://api.ipify.org/?format=json") -> bool:
        """
        Checks the proxy connection by making a request to a test URL.

        On success the proxy is also installed on ``self.session``.

        Args:
            test_url (str): A test site from which we check that the proxy is installed correctly.

        Returns:
            bool: True if the proxy is working, False otherwise.
        """
        try:
            response = self.session.get(test_url, proxies=self.proxy, timeout=10)
        except requests.RequestException:
            return False
        if response.status_code != 200:
            return False
        self.session.proxies = self.proxy
        return True

    def get_access_token(self) -> str:
        """
        Retrieves an access token using Meta's authentication API.

        A token already stored on the instance is returned without a request.

        Returns:
            str: A valid access token.

        Raises:
            exceptions.FacebookRegionBlocked: If the response is not JSON.
        """
        if self.access_token:
            return self.access_token

        url = "https://www.meta.ai/api/graphql/"
        # NOTE(review): "variables" is urlencoded as a Python dict repr here,
        # unlike ask() which sends json.dumps(...) - confirm this is intended.
        payload = urllib.parse.urlencode(  # noqa
            {
                "lsd": self.cookies["lsd"],
                "fb_api_caller_class": "RelayModern",
                "fb_api_req_friendly_name": "useAbraAcceptTOSForTempUserMutation",
                "variables": {
                    "dob": "1999-01-01",
                    "icebreaker_type": "TEXT",
                    "__relay_internal__pv__WebPixelRatiorelayprovider": 1,
                },
                "doc_id": "7604648749596940",
            }
        )
        headers = {
            "content-type": "application/x-www-form-urlencoded",
            "cookie": f'_js_datr={self.cookies["_js_datr"]}; '
            f'abra_csrf={self.cookies["abra_csrf"]}; datr={self.cookies["datr"]};',
            "sec-fetch-site": "same-origin",
            "x-fb-friendly-name": "useAbraAcceptTOSForTempUserMutation",
        }

        response = self.session.post(
            url, headers=headers, data=payload, timeout=self.timeout
        )

        try:
            auth_json = response.json()
        except ValueError as err:
            # ValueError is the common base of the stdlib and simplejson
            # decode errors, either of which requests may raise.
            raise exceptions.FacebookRegionBlocked(
                "Unable to receive a valid response from Meta AI. This is likely due to your region being blocked. "
                "Try manually accessing https://www.meta.ai/ to confirm."
            ) from err

        access_token = auth_json["data"]["xab_abra_accept_terms_of_service"][
            "new_temp_user_auth"
        ]["access_token"]

        # Need to sleep for a bit, for some reason the API doesn't like it when we send request too quickly
        # (maybe Meta needs to register Cookies on their side?)
        time.sleep(1)

        return access_token

    def ask(
        self,
        prompt: str,
        stream: bool = False,
        raw: bool = False,
        optimizer: str = None,
        conversationally: bool = False,
    ) -> Union[Dict, Generator[Dict, None, None]]:
        """
        Sends a message to the Meta AI and returns the response.

        Args:
            prompt (str): The prompt to send.
            stream (bool): Whether to stream the response or not. Defaults to False.
            raw (bool, optional): Stream back raw response as received. Defaults to False.
            optimizer (str, optional): Prompt optimizer name - `[code, shell_command]`. Defaults to None.
            conversationally (bool, optional): Chat conversationally when using optimizer. Defaults to False.

        Returns:
            Union[Dict, Generator[Dict, None, None]]: A dictionary containing the response message and sources, or a generator yielding such dictionaries.

        Raises:
            Exception: If ``optimizer`` is not a known optimizer name.
            exceptions.FailedToGenerateResponseError: If the request fails or
                the response carries no usable message.
        """
        conversation_prompt = self.conversation.gen_complete_prompt(prompt)
        if optimizer:
            if optimizer in self.__available_optimizers:
                conversation_prompt = getattr(Optimizers, optimizer)(
                    conversation_prompt if conversationally else prompt
                )
            else:
                raise Exception(
                    f"Optimizer is not one of {self.__available_optimizers}"
                )

        if not self.is_authed:
            self.access_token = self.get_access_token()
            auth_payload = {"access_token": self.access_token}
            url = "https://graph.meta.ai/graphql?locale=user"
        else:
            auth_payload = {"fb_dtsg": self.cookies["fb_dtsg"]}
            url = "https://www.meta.ai/api/graphql/"

        if not self.external_conversation_id:
            self.external_conversation_id = str(uuid.uuid4())

        payload = urllib.parse.urlencode(  # noqa
            {
                **auth_payload,
                "fb_api_caller_class": "RelayModern",
                "fb_api_req_friendly_name": "useAbraSendMessageMutation",
                "variables": json.dumps(
                    {
                        "message": {"sensitive_string_value": conversation_prompt},
                        "externalConversationId": self.external_conversation_id,
                        "offlineThreadingId": generate_offline_threading_id(),
                        "suggestedPromptIndex": None,
                        "flashVideoRecapInput": {"images": []},
                        "flashPreviewInput": None,
                        "promptPrefix": None,
                        "entrypoint": "ABRA__CHAT__TEXT",
                        "icebreaker_type": "TEXT",
                        "__relay_internal__pv__AbraDebugDevOnlyrelayprovider": False,
                        "__relay_internal__pv__WebPixelRatiorelayprovider": 1,
                    }
                ),
                "server_timestamps": "true",
                "doc_id": "7783822248314888",
            }
        )
        headers = {
            "content-type": "application/x-www-form-urlencoded",
            "x-fb-friendly-name": "useAbraSendMessageMutation",
        }
        if self.is_authed:
            headers["cookie"] = f'abra_sess={self.cookies["abra_sess"]}'
            # Recreate the session to avoid cookie leakage when user is authenticated
            self.session = requests.Session()
            self.session.proxies = self.proxy

        if stream:

            def for_stream():
                response = self.session.post(
                    url, headers=headers, data=payload, stream=True, timeout=self.timeout
                )
                if not response.ok:
                    raise exceptions.FailedToGenerateResponseError(
                        f"Failed to generate response - ({response.status_code}, {response.reason}) - {response.text}"
                    )

                lines = response.iter_lines()
                # A bare next() raising StopIteration inside a generator is
                # converted to RuntimeError; use a default and fail explicitly.
                first_line = next((item for item in lines if item), None)
                if first_line is None:
                    raise exceptions.FailedToGenerateResponseError(
                        "Failed to generate response - empty response body"
                    )
                is_error = json.loads(first_line)
                if len(is_error.get("errors", [])) > 0:
                    # Report the line that holds the errors; it has already
                    # been read off the stream at this point.
                    error_text = (
                        first_line.decode("utf-8", "replace")
                        if isinstance(first_line, bytes)
                        else first_line
                    )
                    raise exceptions.FailedToGenerateResponseError(
                        f"Failed to generate response - {error_text}"
                    )
                for line in lines:
                    if line:
                        json_line = json.loads(line)
                        extracted_data = self.extract_data(json_line)
                        if not extracted_data.get("message"):
                            continue
                        self.last_response.update(extracted_data)
                        yield line if raw else extracted_data
                self.conversation.update_chat_history(
                    prompt, self.get_message(self.last_response)
                )

            return for_stream()

        response = self.session.post(
            url, headers=headers, data=payload, timeout=self.timeout
        )
        if not response.ok:
            raise exceptions.FailedToGenerateResponseError(
                f"Failed to generate response - ({response.status_code}, {response.reason}) - {response.text}"
            )
        last_streamed_response = self.extract_last_response(response.text)
        if not last_streamed_response:
            raise exceptions.FailedToGenerateResponseError(
                f"Failed to generate response - {response.text}"
            )

        extracted_data = self.extract_data(last_streamed_response)
        self.last_response.update(extracted_data)
        self.conversation.update_chat_history(
            prompt, self.get_message(self.last_response)
        )
        return extracted_data

    def chat(
        self,
        prompt: str,
        stream: bool = False,
        optimizer: str = None,
        conversationally: bool = False,
    ) -> str:
        """
        Sends a message to the Meta AI and returns the response.

        Args:
            prompt (str): The message to send.
            stream (bool): Whether to stream the response or not. Defaults to False.
            optimizer (str, optional): Prompt optimizer name - `[code, shell_command]`. Defaults to None.
            conversationally (bool, optional): Chat conversationally when using optimizer. Defaults to False.

        Returns:
            str: The response message, or a generator of messages when
            ``stream`` is True.
        """

        def for_stream():
            for response in self.ask(
                prompt, True, optimizer=optimizer, conversationally=conversationally
            ):
                yield self.get_message(response)

        def for_non_stream():
            return self.get_message(
                self.ask(
                    prompt,
                    False,
                    optimizer=optimizer,
                    conversationally=conversationally,
                )
            )

        return for_stream() if stream else for_non_stream()

    def extract_last_response(self, response: str) -> Dict:
        """
        Find the final ("OVERALL_DONE") message in a newline-delimited JSON body.

        Every line that carries a bot message id also refreshes
        ``self.external_conversation_id`` and ``self.offline_threading_id``.

        Args:
            response (str): Raw response body, one JSON document per line.

        Returns:
            dict: The parsed line whose streaming state is "OVERALL_DONE", or
            None when no such line exists.
        """
        last_streamed_response = None
        for line in response.split("\n"):
            try:
                json_line = json.loads(line)
            except json.JSONDecodeError:
                continue
            # Valid JSON that is not an object carries no message.
            if not isinstance(json_line, dict):
                continue

            # `or {}` also covers keys that are present but explicitly null.
            node = (json_line.get("data") or {}).get("node") or {}
            bot_response_message = node.get("bot_response_message") or {}

            chat_id = bot_response_message.get("id")
            if chat_id:
                # Only the first two "_"-separated fields are used; ids with a
                # different number of fields no longer raise ValueError.
                id_parts = chat_id.split("_")
                if len(id_parts) >= 2:
                    self.external_conversation_id = id_parts[0]
                    self.offline_threading_id = id_parts[1]

            if bot_response_message.get("streaming_state") == "OVERALL_DONE":
                last_streamed_response = json_line

        return last_streamed_response

    def extract_data(self, json_line: dict) -> Dict:
        """
        Extract data and sources from a parsed JSON line.

        Args:
            json_line (dict): Parsed JSON line.

        Returns:
            dict: A dictionary containing the response message, sources, and media.
        """
        node = json_line.get("data", {}).get("node", {})
        bot_message = node.get("bot_response_message", {})
        fetch_id = bot_message.get("fetch_id")
        return {
            "message": format_response(response=json_line),
            "sources": self.fetch_sources(fetch_id) if fetch_id else [],
            "media": self.extract_media(bot_message),
        }

    def extract_media(self, json_line: dict) -> List[Dict]:
        """
        Collect the media entries found under ``imagine_card.session.media_sets``.

        Args:
            json_line (dict): Bot response message dictionary.

        Returns:
            list: One ``{"url", "type", "prompt"}`` dictionary per media item.
        """
        card = json_line.get("imagine_card", {})
        session = card.get("session", {}) if card else {}
        if not (card and session):
            return []
        return [
            {
                "url": item.get("uri"),
                "type": item.get("media_type"),
                "prompt": item.get("prompt"),
            }
            for media_set in session.get("media_sets", [])
            for item in media_set.get("imagine_media", [])
        ]

    def get_cookies(self) -> dict:
        """
        Extracts necessary cookies from the Meta AI main page.

        With credentials set, a Facebook session is obtained first and its
        ``abra_sess`` cookie is used; otherwise ``abra_csrf`` is scraped.

        Returns:
            dict: A dictionary containing essential cookies.
        """
        headers = {}
        fb_session = None
        if self.fb_email is not None and self.fb_password is not None:
            fb_session = get_fb_session(self.fb_email, self.fb_password, self.proxy)
            headers = {"cookie": f"abra_sess={fb_session['abra_sess']}"}

        # Without a timeout requests waits indefinitely on an unresponsive host.
        response = requests.get(
            "https://www.meta.ai/",
            headers=headers,
            proxies=self.proxy,
            timeout=self.timeout,
        )
        page = response.text

        cookies = {
            "_js_datr": extract_value(
                page, start_str='_js_datr":{"value":"', end_str='",'
            ),
            "datr": extract_value(page, start_str='datr":{"value":"', end_str='",'),
            "lsd": extract_value(
                page, start_str='"LSD",[],{"token":"', end_str='"}'
            ),
            "fb_dtsg": extract_value(
                page, start_str='DTSGInitData",[],{"token":"', end_str='"'
            ),
        }

        if fb_session is not None:
            cookies["abra_sess"] = fb_session["abra_sess"]
        else:
            cookies["abra_csrf"] = extract_value(
                page, start_str='abra_csrf":{"value":"', end_str='",'
            )
        return cookies

    def fetch_sources(self, fetch_id: str) -> List[Dict]:
        """
        Fetches sources from the Meta AI API based on the given query.

        Args:
            fetch_id (str): The fetch ID to use for the query.

        Returns:
            list: The ``references`` list of the response's ``searchResults``,
            or an empty list when any level of that path is missing or null.
        """
        url = "https://graph.meta.ai/graphql?locale=user"
        payload = urllib.parse.urlencode(  # noqa
            {
                "access_token": self.access_token,
                "fb_api_caller_class": "RelayModern",
                "fb_api_req_friendly_name": "AbraSearchPluginDialogQuery",
                "variables": json.dumps({"abraMessageFetchID": fetch_id}),
                "server_timestamps": "true",
                "doc_id": "6946734308765963",
            }
        )

        headers = {
            "authority": "graph.meta.ai",
            "accept-language": "en-US,en;q=0.9,fr-FR;q=0.8,fr;q=0.7",
            "content-type": "application/x-www-form-urlencoded",
            "cookie": f'dpr=2; abra_csrf={self.cookies.get("abra_csrf")}; datr={self.cookies.get("datr")}; ps_n=1; ps_l=1',
            "x-fb-friendly-name": "AbraSearchPluginDialogQuery",
        }

        response = self.session.post(
            url, headers=headers, data=payload, timeout=self.timeout
        )
        response_json = response.json()

        # Absent keys and explicit nulls both collapse to "no sources" instead
        # of raising KeyError / AttributeError.
        message = (response_json.get("data") or {}).get("message") or {}
        search_results = message.get("searchResults") or {}
        return search_results.get("references") or []

    def get_message(self, response: dict) -> str:
        """Retrieves message only from response

        Args:
            response (dict): Response generated by `self.ask`

        Returns:
            str: Message extracted
        """
        assert isinstance(response, dict), "Response should be of dict data-type only"
        return response["message"]
789
+
790
if __name__ == "__main__":
    # Use a distinct name for the instance: rebinding `Meta` would shadow the
    # class and make it impossible to create a second client afterwards.
    meta_ai = Meta()
    reply = meta_ai.chat("hi")
    # chat() is called without stream=True, so this iterates whatever it
    # returned piece by piece and prints it without added newlines.
    for chunk in reply:
        print(chunk, end="", flush=True)