abstract-webtools 0.1.6.8__tar.gz → 0.1.6.10__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (34)
  1. {abstract_webtools-0.1.6.8/src/abstract_webtools.egg-info → abstract_webtools-0.1.6.10}/PKG-INFO +1 -1
  2. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/setup.py +1 -1
  3. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/src/abstract_webtools/managers/crawlManager.py +4 -2
  4. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10/src/abstract_webtools.egg-info}/PKG-INFO +1 -1
  5. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/LICENSE +0 -0
  6. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/README.md +0 -0
  7. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/pyproject.toml +0 -0
  8. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/setup.cfg +0 -0
  9. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/src/abstract_webtools/__init__.py +0 -0
  10. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/src/abstract_webtools/abstract_webtools.py +0 -0
  11. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/src/abstract_webtools/big_user_agent_list.py +0 -0
  12. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/src/abstract_webtools/main.py +0 -0
  13. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/src/abstract_webtools/managers/__init__.py +0 -0
  14. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/src/abstract_webtools/managers/cipherManager.py +0 -0
  15. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/src/abstract_webtools/managers/domainManager.py +0 -0
  16. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/src/abstract_webtools/managers/dynamicRateLimiter.py +0 -0
  17. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/src/abstract_webtools/managers/linkManager.py +0 -0
  18. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/src/abstract_webtools/managers/mySocketClient.py +0 -0
  19. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/src/abstract_webtools/managers/networkManager.py +0 -0
  20. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/src/abstract_webtools/managers/requestManager.py +0 -0
  21. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/src/abstract_webtools/managers/seleniumManager.py +0 -0
  22. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/src/abstract_webtools/managers/soupManager.py +0 -0
  23. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/src/abstract_webtools/managers/sslManager.py +0 -0
  24. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/src/abstract_webtools/managers/tlsAdapter.py +0 -0
  25. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/src/abstract_webtools/managers/urlManager.py +0 -0
  26. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/src/abstract_webtools/managers/userAgentManager.py +0 -0
  27. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/src/abstract_webtools/managers/videoDownloader.py +0 -0
  28. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/src/abstract_webtools/soup_gui.py +0 -0
  29. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/src/abstract_webtools/url_grabber.py +0 -0
  30. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/src/abstract_webtools/url_grabber_new.py +0 -0
  31. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/src/abstract_webtools.egg-info/SOURCES.txt +0 -0
  32. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/src/abstract_webtools.egg-info/dependency_links.txt +0 -0
  33. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/src/abstract_webtools.egg-info/requires.txt +0 -0
  34. {abstract_webtools-0.1.6.8 → abstract_webtools-0.1.6.10}/src/abstract_webtools.egg-info/top_level.txt +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: abstract_webtools
3
- Version: 0.1.6.8
3
+ Version: 0.1.6.10
4
4
  Summary: Abstract Web Tools is a Python package that provides various utility functions for web scraping tasks. It is built on top of popular libraries such as `requests`, `BeautifulSoup`, and `urllib3` to simplify the process of fetching and parsing web content.
5
5
  Home-page: https://github.com/AbstractEndeavors/abstract_essentials/tree/main/abstract_webtools
6
6
  Author: putkoff
@@ -4,7 +4,7 @@ with open("README.md", "r", encoding="utf-8") as fh:
4
4
  long_description = fh.read()
5
5
  setuptools.setup(
6
6
  name='abstract_webtools',
7
- version='0.1.6.08',
7
+ version='0.1.6.10',
8
8
  author='putkoff',
9
9
  author_email='partners@abstractendeavors.com',
10
10
  description='Abstract Web Tools is a Python package that provides various utility functions for web scraping tasks. It is built on top of popular libraries such as `requests`, `BeautifulSoup`, and `urllib3` to simplify the process of fetching and parsing web content.',
@@ -19,7 +19,7 @@ class crawlManager():
19
19
  attrs = 'href','src'
20
20
  unique_classes, images=discover_classes_and_images(self,tag_name,class_name_1,class_name_2,class_value,attrs)
21
21
  return unique_classes, images
22
- def extract_links_from_url(self):
22
+ def extract_links_from_url(self,url=None):
23
23
  """
24
24
  Extracts all href and src links from a given URL's source code.
25
25
 
@@ -29,6 +29,8 @@ class crawlManager():
29
29
  Returns:
30
30
  dict: Dictionary containing image links and external links under the parent page.
31
31
  """
32
+ url = url or self.url_mgr.url
33
+ soup_mgr = get_soup_mgr(url=url)
32
34
  agg_js = {'images':[],'external_links':[]}
33
35
 
34
36
  if self.response != None:
@@ -36,7 +38,7 @@ class crawlManager():
36
38
  href_links,src_links='',''
37
39
  links = [href_links,src_links]
38
40
  for i,each in enumerate(attrs):
39
- links[i]= [a[attr[i]] for a in get_find_all_with_attributes(self, attrs[i])]
41
+ links[i]= [a[attr[i]] for a in soup_mgr.get_find_all_with_attributes(attrs[i])]
40
42
  # Convert all links to absolute links
41
43
  absolute_links = [(url, link) for link in links[0] + links[1]]
42
44
  # Separate images and external links
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: abstract_webtools
3
- Version: 0.1.6.8
3
+ Version: 0.1.6.10
4
4
  Summary: Abstract Web Tools is a Python package that provides various utility functions for web scraping tasks. It is built on top of popular libraries such as `requests`, `BeautifulSoup`, and `urllib3` to simplify the process of fetching and parsing web content.
5
5
  Home-page: https://github.com/AbstractEndeavors/abstract_essentials/tree/main/abstract_webtools
6
6
  Author: putkoff