abstract-webtools 0.1.6.116__tar.gz → 0.1.6.117__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/PKG-INFO +1 -1
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/setup.py +1 -1
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/abstract_usurpit.py +10 -3
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools.egg-info/PKG-INFO +1 -1
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/README.md +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/pyproject.toml +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/setup.cfg +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/__init__.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/abstract_webtools.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/big_user_agent_list.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/domain_identifier.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/extention_list.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/find_dirs.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/k2s_downloader.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/main.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/managers/__init__.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/managers/allss//.py" +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/managers/cipherManager.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/managers/crawlManager.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/managers/crawlmgr2.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/managers/curlMgr.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/managers/domainManager.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/managers/dynamicRateLimiter.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/managers/get_test.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/managers/linkManager/__init__.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/managers/linkManager/linkManager.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/managers/mySocketClient.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/managers/networkManager.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/managers/requestManager/__init__.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/managers/requestManager/requestManager.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/managers/seleniumManager.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/managers/soupManager/__init__.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/managers/soupManager/asoueces.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/managers/soupManager/soupManager.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/managers/sslManager.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/managers/tlsAdapter.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/managers/urlManager/__init__.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/managers/urlManager/urlManager.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/managers/userAgentManager.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/managers/videoDownloader.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/managers/videoDownloader2.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/soup_gui.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/url_grabber.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/url_grabber_new.py +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools.egg-info/SOURCES.txt +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools.egg-info/dependency_links.txt +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools.egg-info/requires.txt +0 -0
- {abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools.egg-info/top_level.txt +0 -0
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.4
|
2
2
|
Name: abstract_webtools
|
3
|
-
Version: 0.1.6.116
|
3
|
+
Version: 0.1.6.117
|
4
4
|
Summary: Abstract Web Tools is a Python package that provides various utility functions for web scraping tasks. It is built on top of popular libraries such as `requests`, `BeautifulSoup`, and `urllib3` to simplify the process of fetching and parsing web content.
|
5
5
|
Home-page: https://github.com/AbstractEndeavors/abstract_essentials/tree/main/abstract_webtools
|
6
6
|
Author: putkoff
|
@@ -4,7 +4,7 @@ with open("README.md", "r", encoding="utf-8") as fh:
|
|
4
4
|
long_description = fh.read()
|
5
5
|
setuptools.setup(
|
6
6
|
name='abstract_webtools',
|
7
|
-
version='0.1.6.116',
|
7
|
+
version='0.1.6.117',
|
8
8
|
author='putkoff',
|
9
9
|
author_email='partners@abstractendeavors.com',
|
10
10
|
description='Abstract Web Tools is a Python package that provides various utility functions for web scraping tasks. It is built on top of popular libraries such as `requests`, `BeautifulSoup`, and `urllib3` to simplify the process of fetching and parsing web content.',
|
@@ -9,7 +9,13 @@ from abstract_utilities import *
|
|
9
9
|
|
10
10
|
# Import your custom classes/functions
|
11
11
|
# from your_module import linkManager, get_soup_mgr
|
12
|
-
|
12
|
+
def get_directory_from_url(url):
|
13
|
+
parsed_url = urlparse(url)
|
14
|
+
netloc = parsed_url['netloc']
|
15
|
+
directory_name = netloc.split('.')
|
16
|
+
if directory_name.startswith('www.'):
|
17
|
+
directory_name = directory_name[len('www.'):]
|
18
|
+
return directory_name
|
13
19
|
# Configuration
|
14
20
|
def normalize_url(url, base_url):
|
15
21
|
"""
|
@@ -164,12 +170,13 @@ class usurpManager():
|
|
164
170
|
print("Website copying completed.")
|
165
171
|
def test_download(url=None,directory=None):
|
166
172
|
url=url or 'https://www.youtube.com/watch?v=jRGrNDV2mKc&list=RDMMjRGrNDV2mKc&start_radio=1'
|
167
|
-
|
173
|
+
|
174
|
+
output_dir= directory or get_directory_from_url(url) or os.path.join(os.getcwd(),'testit')
|
168
175
|
os.makedirs(output_dir,exist_ok=True)
|
169
176
|
site_mgr = usurpManager(url,output_dir)
|
170
177
|
|
171
178
|
def usurpit(url,output_dir=None,max_depth=None,wait_between_requests=None,operating_system=None, browser=None, version=None,user_agent=None,website_bot=None):
|
172
|
-
output_dir= output_dir or os.path.join(os.getcwd(),'usurped')
|
179
|
+
output_dir= output_dir or get_directory_from_url(url) or os.path.join(os.getcwd(),'usurped')
|
173
180
|
os.makedirs(output_dir,exist_ok=True)
|
174
181
|
site_mgr = usurpManager(url,output_dir=output_dir,max_depth=max_depth,wait_between_requests=wait_between_requests,operating_system=operating_system, browser=browser, version=version,user_agent=user_agent,website_bot=website_bot)
|
175
182
|
site_mgr.main()
|
{abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools.egg-info/PKG-INFO
RENAMED
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.4
|
2
2
|
Name: abstract_webtools
|
3
|
-
Version: 0.1.6.116
|
3
|
+
Version: 0.1.6.117
|
4
4
|
Summary: Abstract Web Tools is a Python package that provides various utility functions for web scraping tasks. It is built on top of popular libraries such as `requests`, `BeautifulSoup`, and `urllib3` to simplify the process of fetching and parsing web content.
|
5
5
|
Home-page: https://github.com/AbstractEndeavors/abstract_essentials/tree/main/abstract_webtools
|
6
6
|
Author: putkoff
|
File without changes
|
File without changes
|
File without changes
|
{abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/__init__.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/extention_list.py
RENAMED
File without changes
|
{abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/find_dirs.py
RENAMED
File without changes
|
{abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/k2s_downloader.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/soup_gui.py
RENAMED
File without changes
|
{abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/url_grabber.py
RENAMED
File without changes
|
{abstract_webtools-0.1.6.116 → abstract_webtools-0.1.6.117}/src/abstract_webtools/url_grabber_new.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|