abstract-webtools 0.1.5.96__tar.gz → 0.1.5.98__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (34)
  1. {abstract_webtools-0.1.5.96/src/abstract_webtools.egg-info → abstract_webtools-0.1.5.98}/PKG-INFO +1 -1
  2. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/setup.py +1 -1
  3. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/src/abstract_webtools/managers/requestManager.py +2 -2
  4. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/src/abstract_webtools/managers/soupManager.py +5 -5
  5. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98/src/abstract_webtools.egg-info}/PKG-INFO +1 -1
  6. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/LICENSE +0 -0
  7. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/README.md +0 -0
  8. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/pyproject.toml +0 -0
  9. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/setup.cfg +0 -0
  10. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/src/abstract_webtools/__init__.py +0 -0
  11. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/src/abstract_webtools/abstract_webtools.py +0 -0
  12. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/src/abstract_webtools/big_user_agent_list.py +0 -0
  13. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/src/abstract_webtools/main.py +0 -0
  14. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/src/abstract_webtools/managers/__init__.py +0 -0
  15. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/src/abstract_webtools/managers/cipherManager.py +0 -0
  16. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/src/abstract_webtools/managers/crawlManager.py +0 -0
  17. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/src/abstract_webtools/managers/domainManager.py +0 -0
  18. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/src/abstract_webtools/managers/dynamicRateLimiter.py +0 -0
  19. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/src/abstract_webtools/managers/linkManager.py +0 -0
  20. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/src/abstract_webtools/managers/mySocketClient.py +0 -0
  21. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/src/abstract_webtools/managers/networkManager.py +0 -0
  22. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/src/abstract_webtools/managers/seleniumManager.py +0 -0
  23. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/src/abstract_webtools/managers/sslManager.py +0 -0
  24. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/src/abstract_webtools/managers/tlsAdapter.py +0 -0
  25. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/src/abstract_webtools/managers/urlManager.py +0 -0
  26. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/src/abstract_webtools/managers/userAgentManager.py +0 -0
  27. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/src/abstract_webtools/managers/videoDownloader.py +0 -0
  28. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/src/abstract_webtools/soup_gui.py +0 -0
  29. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/src/abstract_webtools/url_grabber.py +0 -0
  30. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/src/abstract_webtools/url_grabber_new.py +0 -0
  31. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/src/abstract_webtools.egg-info/SOURCES.txt +0 -0
  32. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/src/abstract_webtools.egg-info/dependency_links.txt +0 -0
  33. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/src/abstract_webtools.egg-info/requires.txt +0 -0
  34. {abstract_webtools-0.1.5.96 → abstract_webtools-0.1.5.98}/src/abstract_webtools.egg-info/top_level.txt +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: abstract_webtools
3
- Version: 0.1.5.96
3
+ Version: 0.1.5.98
4
4
  Summary: Abstract Web Tools is a Python package that provides various utility functions for web scraping tasks. It is built on top of popular libraries such as `requests`, `BeautifulSoup`, and `urllib3` to simplify the process of fetching and parsing web content.
5
5
  Home-page: https://github.com/AbstractEndeavors/abstract_essentials/tree/main/abstract_webtools
6
6
  Author: putkoff
@@ -4,7 +4,7 @@ with open("README.md", "r", encoding="utf-8") as fh:
4
4
  long_description = fh.read()
5
5
  setuptools.setup(
6
6
  name='abstract_webtools',
7
- version='0.1.5.96',
7
+ version='0.1.5.98',
8
8
  author='putkoff',
9
9
  author_email='partners@abstractendeavors.com',
10
10
  description='Abstract Web Tools is a Python package that provides various utility functions for web scraping tasks. It is built on top of popular libraries such as `requests`, `BeautifulSoup`, and `urllib3` to simplify the process of fetching and parsing web content.',
@@ -341,10 +341,10 @@ class SafeRequestSingleton:
341
341
  elif SafeRequestSingleton._instance.url != url or SafeRequestSingleton._instance.headers != headers or SafeRequestSingleton._instance.max_retries != max_retries or SafeRequestSingleton._instance.request_wait_limit != request_wait_limit:
342
342
  SafeRequestSingleton._instance = SafeRequest(url,url_mgr=urlManagerSingleton,headers=headers,max_retries=max_retries,last_request_time=last_request_time,request_wait_limit=request_wait_limit)
343
343
  return SafeRequestSingleton._instance
344
- def get_req_mgr(url=None,url_mgr=None,source_code=None):
344
+ def get_req_mgr(url=None,url_mgr=None,source_code=None,req_mgr=None):
345
345
  url = get_url(url=url,url_mgr=url_mgr)
346
346
  url_mgr = get_url_mgr(url=url,url_mgr=url_mgr )
347
- req_mgr = requestManager(url_mgr=url_mgr,url=url,source_code=source_code)
347
+ req_mgr = req_mgr or requestManager(url_mgr=url_mgr,url=url,source_code=source_code)
348
348
  return req_mgr
349
349
  def get_source(url=None,url_mgr=None,source_code=None):
350
350
  # Placeholder for actual implementation.
@@ -279,21 +279,21 @@ class soupManager:
279
279
  attribute_names_list = list(attribute_names)
280
280
  return {"tags":tag_names_list,"attributes":attribute_names_list}
281
281
 
282
- def get_all_attribute_values(self, tag_list=None):
282
+ def get_all_attribute_values(self, tags_list=None):
283
283
  """
284
284
  Collects all attribute values for each specified tag or all tags if none are specified.
285
285
 
286
286
  Parameters:
287
- - tag_list: List of specific tags to retrieve attributes from, e.g., ['script', 'img'].
287
+ - tags_list: List of specific tags to retrieve attributes from, e.g., ['script', 'img'].
288
288
  If None, retrieves attributes for all tags.
289
289
 
290
290
  Returns:
291
291
  - attribute_values: Dictionary where each key is an attribute and the value is a list of unique values for that attribute.
292
292
  """
293
293
  attribute_values = {}
294
- tag_list = tag_list or self.all_tags_and_attributes
295
- # Get all tags matching tag_list criteria
296
- for tag_name in tag_list:
294
+ tags_list = tags_list or self.all_tags_and_attributes
295
+ # Get all tags matching tags_list criteria
296
+ for tag_name in tags_list:
297
297
  for tag in self.soup.find_all(tag_name):
298
298
  for attr, value in tag.attrs.items():
299
299
  if attr not in attribute_values:
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: abstract_webtools
3
- Version: 0.1.5.96
3
+ Version: 0.1.5.98
4
4
  Summary: Abstract Web Tools is a Python package that provides various utility functions for web scraping tasks. It is built on top of popular libraries such as `requests`, `BeautifulSoup`, and `urllib3` to simplify the process of fetching and parsing web content.
5
5
  Home-page: https://github.com/AbstractEndeavors/abstract_essentials/tree/main/abstract_webtools
6
6
  Author: putkoff