abstract-webtools 0.1.5.89__tar.gz → 0.1.5.91__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {abstract_webtools-0.1.5.89/src/abstract_webtools.egg-info → abstract_webtools-0.1.5.91}/PKG-INFO +1 -1
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/setup.py +1 -1
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools/managers/domainManager.py +4 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools/managers/requestManager.py +7 -8
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91/src/abstract_webtools.egg-info}/PKG-INFO +1 -1
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/LICENSE +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/README.md +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/pyproject.toml +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/setup.cfg +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools/__init__.py +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools/abstract_webtools.py +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools/big_user_agent_list.py +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools/main.py +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools/managers/__init__.py +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools/managers/cipherManager.py +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools/managers/crawlManager.py +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools/managers/dynamicRateLimiter.py +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools/managers/linkManager.py +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools/managers/mySocketClient.py +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools/managers/networkManager.py +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools/managers/seleniumManager.py +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools/managers/soupManager.py +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools/managers/sslManager.py +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools/managers/tlsAdapter.py +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools/managers/urlManager.py +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools/managers/userAgentManager.py +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools/managers/videoDownloader.py +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools/soup_gui.py +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools/url_grabber.py +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools/url_grabber_new.py +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools.egg-info/SOURCES.txt +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools.egg-info/dependency_links.txt +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools.egg-info/requires.txt +0 -0
- {abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools.egg-info/top_level.txt +0 -0
{abstract_webtools-0.1.5.89/src/abstract_webtools.egg-info → abstract_webtools-0.1.5.91}/PKG-INFO
RENAMED
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: abstract_webtools
|
3
|
-
Version: 0.1.5.89
|
3
|
+
Version: 0.1.5.91
|
4
4
|
Summary: Abstract Web Tools is a Python package that provides various utility functions for web scraping tasks. It is built on top of popular libraries such as `requests`, `BeautifulSoup`, and `urllib3` to simplify the process of fetching and parsing web content.
|
5
5
|
Home-page: https://github.com/AbstractEndeavors/abstract_essentials/tree/main/abstract_webtools
|
6
6
|
Author: putkoff
|
@@ -4,7 +4,7 @@ with open("README.md", "r", encoding="utf-8") as fh:
|
|
4
4
|
long_description = fh.read()
|
5
5
|
setuptools.setup(
|
6
6
|
name='abstract_webtools',
|
7
|
-
version='0.1.5.89',
|
7
|
+
version='0.1.5.91',
|
8
8
|
author='putkoff',
|
9
9
|
author_email='partners@abstractendeavors.com',
|
10
10
|
description='Abstract Web Tools is a Python package that provides various utility functions for web scraping tasks. It is built on top of popular libraries such as `requests`, `BeautifulSoup`, and `urllib3` to simplify the process of fetching and parsing web content.',
|
@@ -6,6 +6,10 @@ class domainManager(metaclass=SingletonMeta):
|
|
6
6
|
parsed_url = urlparse(url)
|
7
7
|
self.domain = parsed_url.netloc
|
8
8
|
self.scheme = parsed_url.scheme
|
9
|
+
self.site_dir = os.path.join(os.getcwd(), self.domain)
|
10
|
+
os.makedirs(self.site_dir, exist_ok=True)
|
11
|
+
self.drivers = {}
|
12
|
+
self.page_type = []
|
9
13
|
def get_url_to_path(self, url):
|
10
14
|
url = eatAll(str(url),['',' ','\n','\t','\\','/'])
|
11
15
|
parsed_url = urlparse(url)
|
@@ -1,11 +1,12 @@
|
|
1
1
|
from ..abstract_webtools import *
|
2
|
-
|
2
|
+
|
3
3
|
from .userAgentManager import *
|
4
4
|
from .cipherManager import *
|
5
5
|
from .sslManager import *
|
6
6
|
from .tlsAdapter import *
|
7
7
|
from .networkManager import *
|
8
8
|
from .seleniumManager import *
|
9
|
+
from .urlManager import *
|
9
10
|
class requestManager:
|
10
11
|
"""
|
11
12
|
SafeRequest is a class for making HTTP requests with error handling and retries.
|
@@ -87,8 +88,8 @@ class requestManager:
|
|
87
88
|
last_request_time=None,
|
88
89
|
max_retries=None,
|
89
90
|
request_wait_limit=None):
|
90
|
-
self.
|
91
|
-
self.
|
91
|
+
self.url_mgr = get_url_mgr(url=url,url_mgr=url_mgr)
|
92
|
+
self.url=get_url(url=url,url_mgr=self.url_mgr)
|
92
93
|
self._url_mgr = self.url_mgr
|
93
94
|
self._url=self.url
|
94
95
|
self.user_agent = user_agent
|
@@ -340,12 +341,10 @@ class SafeRequestSingleton:
|
|
340
341
|
elif SafeRequestSingleton._instance.url != url or SafeRequestSingleton._instance.headers != headers or SafeRequestSingleton._instance.max_retries != max_retries or SafeRequestSingleton._instance.request_wait_limit != request_wait_limit:
|
341
342
|
SafeRequestSingleton._instance = SafeRequest(url,url_mgr=urlManagerSingleton,headers=headers,max_retries=max_retries,last_request_time=last_request_time,request_wait_limit=request_wait_limit)
|
342
343
|
return SafeRequestSingleton._instance
|
343
|
-
def get_req_mgr(
|
344
|
-
if req_mgr:
|
345
|
-
url_mgr = req_mgr.url_mgr
|
344
|
+
def get_req_mgr(url=None,url_mgr=None,source_code=None):
|
346
345
|
url = get_url(url=url,url_mgr=url_mgr)
|
347
|
-
url_mgr = get_url_mgr(url=url,url_mgr=url_mgr)
|
348
|
-
req_mgr =
|
346
|
+
url_mgr = get_url_mgr(url=url,url_mgr=url_mgr )
|
347
|
+
req_mgr = requestManager(url_mgr=url_mgr,url=url,source_code=source_code)
|
349
348
|
return req_mgr
|
350
349
|
def get_source(url=None,url_mgr=None,source_code=None):
|
351
350
|
# Placeholder for actual implementation.
|
{abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91/src/abstract_webtools.egg-info}/PKG-INFO
RENAMED
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: abstract_webtools
|
3
|
-
Version: 0.1.5.89
|
3
|
+
Version: 0.1.5.91
|
4
4
|
Summary: Abstract Web Tools is a Python package that provides various utility functions for web scraping tasks. It is built on top of popular libraries such as `requests`, `BeautifulSoup`, and `urllib3` to simplify the process of fetching and parsing web content.
|
5
5
|
Home-page: https://github.com/AbstractEndeavors/abstract_essentials/tree/main/abstract_webtools
|
6
6
|
Author: putkoff
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools/abstract_webtools.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
{abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools/managers/__init__.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools/url_grabber.py
RENAMED
File without changes
|
{abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools/url_grabber_new.py
RENAMED
File without changes
|
{abstract_webtools-0.1.5.89 → abstract_webtools-0.1.5.91}/src/abstract_webtools.egg-info/SOURCES.txt
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|