abstract-webtools 0.1.6.153__tar.gz → 0.1.6.154__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/PKG-INFO +1 -1
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/setup.py +1 -1
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/url_grabber.py +2 -51
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools.egg-info/PKG-INFO +1 -1
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/README.md +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/pyproject.toml +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/setup.cfg +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/__init__.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/abstract_usurpit.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/abstract_webtools.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/big_user_agent_list.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/domain_identifier.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/extention_list.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/find_dirs.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/k2s_downloader.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/main.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/__init__.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/allss.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/cipherManager.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/clownworld/__init__.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/clownworld/get_bolshevid_video.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/crawlManager.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/crawlmgr2.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/curlMgr.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/domainManager.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/dynamicRateLimiter.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/get_test.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/linkManager/__init__.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/linkManager/linkManager.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/meta_dump.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/middleManager/__init__.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/middleManager/imports.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/middleManager/src/UnifiedWebManage3r.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/middleManager/src/UnifiedWebManager.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/middleManager/src/__init__.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/middleManager/src/legacy_tools.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/mySocketClient.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/networkManager.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/requestManager/__init__.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/requestManager/requestManager.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/seleneumManager.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/seleniumManager.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/soupManager/__init__.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/soupManager/asoueces.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/soupManager/soupManager.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/sslManager.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/tlsAdapter.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/urlManager/__init__.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/urlManager/urlManager (Copy).py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/urlManager/urlManager.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/userAgentManager.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/videoDownloader.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/videoDownloader2.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/soup_gui.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/url_grabber_new.py +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools.egg-info/SOURCES.txt +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools.egg-info/dependency_links.txt +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools.egg-info/requires.txt +0 -0
- {abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools.egg-info/top_level.txt +0 -0
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.4
|
2
2
|
Name: abstract_webtools
|
3
|
-
Version: 0.1.6.153
|
3
|
+
Version: 0.1.6.154
|
4
4
|
Summary: Utilities for fetching/parsing web content with requests/urllib3/BS4 and helpers.
|
5
5
|
Home-page: https://github.com/AbstractEndeavors/abstract_webtools
|
6
6
|
Author: putkoff
|
@@ -5,7 +5,7 @@ README = Path("README.md").read_text(encoding="utf-8")
|
|
5
5
|
|
6
6
|
setup(
|
7
7
|
name="abstract_webtools",
|
8
|
-
version='0.1.6.153', # bump once per release
|
8
|
+
version='0.1.6.154', # bump once per release
|
9
9
|
author="putkoff",
|
10
10
|
author_email="partners@abstractendeavors.com",
|
11
11
|
description="Utilities for fetching/parsing web content with requests/urllib3/BS4 and helpers.",
|
{abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/url_grabber.py
RENAMED
@@ -1,7 +1,6 @@
|
|
1
1
|
from abstract_gui import make_component,sg
|
2
2
|
import inspect
|
3
3
|
import re
|
4
|
-
from . import UserAgentManager,UrlManager,SafeRequest,SoupManager,LinkManager,CipherManager,requests,ssl,BeautifulSoup,HTTPAdapter,PoolManager,ssl_
|
5
4
|
from .managers import *
|
6
5
|
window = None
|
7
6
|
|
@@ -26,7 +25,6 @@ def get_attrs(values):
|
|
26
25
|
else:
|
27
26
|
tags_js['attribute']=tags_js['attribute'][0]
|
28
27
|
return tags_js
|
29
|
-
|
30
28
|
def get_user_agent_mgr(user_agent=None):
|
31
29
|
return UserAgentManager(user_agent=user_agent)
|
32
30
|
def get_cipher_list():
|
@@ -130,10 +128,6 @@ def process_url(window,values):
|
|
130
128
|
if warn_url=='' or warn_url == None:
|
131
129
|
update_status(window,warn,warn_url,response_code,valid)
|
132
130
|
return False
|
133
|
-
temp_url=UrlManager(url=warn_url).url
|
134
|
-
if temp_url:
|
135
|
-
valid='valid'
|
136
|
-
response_code = SafeRequest(url=temp_mgr).response.status_code
|
137
131
|
temp_url=urlManager(url=warn_url).url
|
138
132
|
if temp_url:
|
139
133
|
valid='valid'
|
@@ -144,24 +138,7 @@ def process_url(window,values):
|
|
144
138
|
return temp_mgr
|
145
139
|
update_status(window,warn,warn_url,response_code,valid)
|
146
140
|
return False
|
147
|
-
def update_url(
|
148
|
-
ciphers = CipherManager(cipher_list=cipher_list).ciphers_string
|
149
|
-
request_manager = SafeRequest(url_manager=url_manager,ciphers=ciphers,user_agent=get_user_agents()[0])
|
150
|
-
if request_manager.source_code:
|
151
|
-
soup_manager= SoupManager(url_manager=url_manager,request_manager=request_manager)
|
152
|
-
link_manager= LinkManager(url_manager=url_manager,request_manager=request_manager,soup_manager=soup_manager)
|
153
|
-
window['-URL-'].update(value=url_manager.url)
|
154
|
-
window['-CIPHERS_OUTPUT-'].update(value=request_manager.ciphers)
|
155
|
-
return update_source_code(url_manager,request_manager,soup_manager,link_manager,values)
|
156
|
-
else:
|
157
|
-
return url_manager,request_manager,soup_manager,link_manager
|
158
|
-
def update_source_code(url_manager,request_manager,soup_manager,link_manager,values):
|
159
|
-
parse_type = values['-parse_type-']
|
160
|
-
if parse_type != soup_manager.parse_type:
|
161
|
-
soup_manager.update_parse_type(parse_type=parse_type)
|
162
|
-
all_tags=soup_manager.get_all_tags_and_attribute_names()
|
163
|
-
window['-SOURCECODE-'].update(value=soup_manager.soup)
|
164
|
-
window['-SOURCECODE-'].update(value=soup_manager.soupdef update_url(url_mgr,request_mgr,soup_mgr,link_mgr,values,cipher_list=get_cipher_list(),user_agent=get_user_agents()[0]):
|
141
|
+
def update_url(url_mgr,request_mgr,soup_mgr,link_mgr,values,cipher_list=get_cipher_list(),user_agent=get_user_agents()[0]):
|
165
142
|
ciphers = CipherManager(cipher_list=cipher_list).ciphers_string
|
166
143
|
request_mgr = requestManager(url_mgr=url_mgr,ciphers=ciphers,user_agent=get_user_agents()[0])
|
167
144
|
if request_mgr.source_code:
|
@@ -184,15 +161,7 @@ def update_source_code(url_mgr,request_mgr,soup_mgr,link_mgr,values):
|
|
184
161
|
window['-SOUP_ATTRIBUTE-'].update(values=all_tags['attributes'],value=all_tags['attributes'][0])
|
185
162
|
window['-SOUP_ATTRIBUTE_1-'].update(values=all_tags['attributes'],value=all_tags['attributes'][0])
|
186
163
|
window['-SOUP_ATTRIBUTE_2-'].update(values=all_tags['attributes'],value=all_tags['attributes'][0])
|
187
|
-
return
|
188
|
-
def url_grabber_while(window,initial_url="www.example.com"):
|
189
|
-
return_data=None
|
190
|
-
url_grab = False
|
191
|
-
url_manager=UrlManager(url=initial_url)
|
192
|
-
request_manager = SafeRequest(url_manager=url_manager)
|
193
|
-
soup_manager= SoupManager(url_manager=url_manager,request_manager=request_manager)
|
194
|
-
link_manager= LinkManager(url_manager=url_manager,request_manager=request_manager,soup_manager=soup_manager)
|
195
|
-
return url_mgr,request_mgr,soup_mgr,link_mgr
|
164
|
+
return url_mgr,request_mgr,soup_mgr,link_mgr
|
196
165
|
def url_grabber_while(window,initial_url="www.example.com"):
|
197
166
|
return_data=None
|
198
167
|
url_grab = False
|
@@ -206,16 +175,6 @@ def url_grabber_while(window,initial_url="www.example.com"):
|
|
206
175
|
break
|
207
176
|
if event=='-GRAB_URL-' or not url_grab:
|
208
177
|
url=values['-URL-']
|
209
|
-
if UrlManager(url=url).url:
|
210
|
-
if url != url_manager.url or url == initial_url:
|
211
|
-
url_manager = UrlManager(url=url)
|
212
|
-
|
213
|
-
url_manager,request_manager,soup_manager,link_manager=update_url(url_manager=url_manager,request_manager=request_manager,soup_manager=soup_manager,link_manager=link_manager,values=values)
|
214
|
-
window['-URL-'].update(value=url_manager.url)
|
215
|
-
url_grab=True
|
216
|
-
if event == 'get soup':
|
217
|
-
tags_js = get_attrs(values)
|
218
|
-
all_desired=soup_manager.find_tags_by_attributes(tag=tags_js['tag'], attr=tags_js['attribute'],attr_values=tags_js['input'])
|
219
178
|
if urlManager(url=url).url:
|
220
179
|
if url != url_mgr.url or url == initial_url:
|
221
180
|
url_mgr = urlManager(url=url)
|
@@ -230,18 +189,11 @@ def url_grabber_while(window,initial_url="www.example.com"):
|
|
230
189
|
if event == '-CUSTOMUA-':
|
231
190
|
window['-SOURCECODE-'].update(disabled=values['-CUSTOMUA-'])
|
232
191
|
if not values['-CUSTOMUA-']:
|
233
|
-
window['-USERAGENT-'].update(value=user_agent_manager.user_agent_header)
|
234
192
|
window['-USERAGENT-'].update(value=user_agent_mgr.user_agent_header)
|
235
193
|
window['-USERAGENT-'].update(disabled=True)
|
236
194
|
else:
|
237
195
|
window['-USERAGENT-'].update(disabled=False)
|
238
196
|
if event=='Get All Text':
|
239
|
-
window['-FIND_ALL_OUTPUT-'].update(value=soup_manager.extract_text_sections())
|
240
|
-
if event == 'Action':
|
241
|
-
parse_type = values['-parse_type-']
|
242
|
-
if parse_type != soup_manager.parse_type:
|
243
|
-
soup_manager.update_parse_type(parse_type=parse_type)
|
244
|
-
window['-SOURCECODE-'].update(value=soup_manager.soup)
|
245
197
|
window['-FIND_ALL_OUTPUT-'].update(value=soup_mgr.extract_text_sections())
|
246
198
|
if event == 'Action':
|
247
199
|
parse_type = values['-parse_type-']
|
@@ -258,4 +210,3 @@ def url_grabber_component(url=None):
|
|
258
210
|
url = "www.example.com"
|
259
211
|
globals()['window'] = make_component('Window','URL Grabber', layout=get_gpt_layout(url),**expandable())
|
260
212
|
return url_grabber_while(window,initial_url=url)
|
261
|
-
|
{abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools.egg-info/PKG-INFO
RENAMED
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.4
|
2
2
|
Name: abstract_webtools
|
3
|
-
Version: 0.1.6.153
|
3
|
+
Version: 0.1.6.154
|
4
4
|
Summary: Utilities for fetching/parsing web content with requests/urllib3/BS4 and helpers.
|
5
5
|
Home-page: https://github.com/AbstractEndeavors/abstract_webtools
|
6
6
|
Author: putkoff
|
File without changes
|
File without changes
|
File without changes
|
{abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/__init__.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/extention_list.py
RENAMED
File without changes
|
{abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/find_dirs.py
RENAMED
File without changes
|
{abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/k2s_downloader.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
{abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/managers/allss.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/soup_gui.py
RENAMED
File without changes
|
{abstract_webtools-0.1.6.153 → abstract_webtools-0.1.6.154}/src/abstract_webtools/url_grabber_new.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|