abstract-webtools 0.1.6.117__tar.gz → 0.1.6.119__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (48)
  1. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/PKG-INFO +1 -1
  2. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/setup.py +1 -1
  3. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/abstract_usurpit.py +16 -5
  4. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools.egg-info/PKG-INFO +1 -1
  5. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/README.md +0 -0
  6. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/pyproject.toml +0 -0
  7. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/setup.cfg +0 -0
  8. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/__init__.py +0 -0
  9. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/abstract_webtools.py +0 -0
  10. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/big_user_agent_list.py +0 -0
  11. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/domain_identifier.py +0 -0
  12. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/extention_list.py +0 -0
  13. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/find_dirs.py +0 -0
  14. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/k2s_downloader.py +0 -0
  15. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/main.py +0 -0
  16. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/managers/__init__.py +0 -0
  17. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/managers/allss//.py" +0 -0
  18. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/managers/cipherManager.py +0 -0
  19. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/managers/crawlManager.py +0 -0
  20. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/managers/crawlmgr2.py +0 -0
  21. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/managers/curlMgr.py +0 -0
  22. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/managers/domainManager.py +0 -0
  23. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/managers/dynamicRateLimiter.py +0 -0
  24. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/managers/get_test.py +0 -0
  25. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/managers/linkManager/__init__.py +0 -0
  26. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/managers/linkManager/linkManager.py +0 -0
  27. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/managers/mySocketClient.py +0 -0
  28. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/managers/networkManager.py +0 -0
  29. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/managers/requestManager/__init__.py +0 -0
  30. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/managers/requestManager/requestManager.py +0 -0
  31. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/managers/seleniumManager.py +0 -0
  32. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/managers/soupManager/__init__.py +0 -0
  33. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/managers/soupManager/asoueces.py +0 -0
  34. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/managers/soupManager/soupManager.py +0 -0
  35. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/managers/sslManager.py +0 -0
  36. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/managers/tlsAdapter.py +0 -0
  37. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/managers/urlManager/__init__.py +0 -0
  38. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/managers/urlManager/urlManager.py +0 -0
  39. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/managers/userAgentManager.py +0 -0
  40. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/managers/videoDownloader.py +0 -0
  41. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/managers/videoDownloader2.py +0 -0
  42. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/soup_gui.py +0 -0
  43. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/url_grabber.py +0 -0
  44. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools/url_grabber_new.py +0 -0
  45. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools.egg-info/SOURCES.txt +0 -0
  46. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools.egg-info/dependency_links.txt +0 -0
  47. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools.egg-info/requires.txt +0 -0
  48. {abstract_webtools-0.1.6.117 → abstract_webtools-0.1.6.119}/src/abstract_webtools.egg-info/top_level.txt +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: abstract_webtools
3
- Version: 0.1.6.117
3
+ Version: 0.1.6.119
4
4
  Summary: Abstract Web Tools is a Python package that provides various utility functions for web scraping tasks. It is built on top of popular libraries such as `requests`, `BeautifulSoup`, and `urllib3` to simplify the process of fetching and parsing web content.
5
5
  Home-page: https://github.com/AbstractEndeavors/abstract_essentials/tree/main/abstract_webtools
6
6
  Author: putkoff
@@ -4,7 +4,7 @@ with open("README.md", "r", encoding="utf-8") as fh:
4
4
  long_description = fh.read()
5
5
  setuptools.setup(
6
6
  name='abstract_webtools',
7
- version='0.1.6.117',
7
+ version='0.1.6.119',
8
8
  author='putkoff',
9
9
  author_email='partners@abstractendeavors.com',
10
10
  description='Abstract Web Tools is a Python package that provides various utility functions for web scraping tasks. It is built on top of popular libraries such as `requests`, `BeautifulSoup`, and `urllib3` to simplify the process of fetching and parsing web content.',
@@ -9,13 +9,25 @@ from abstract_utilities import *
9
9
 
10
10
  # Import your custom classes/functions
11
11
  # from your_module import linkManager, get_soup_mgr
12
- def get_directory_from_url(url):
12
+ def make_directory(directory=None,path=None):
13
+ if directory==None:
14
+ directory=os.getcwd()
15
+ if path:
16
+ directory = os.path.join(base_dir,path)
17
+ os.makedirs(directory,exist_ok=True)
18
+ return directory
19
+ def get_domain_name_from_url(url):
13
20
  parsed_url = urlparse(url)
14
- netloc = parsed_url['netloc']
15
- directory_name = netloc.split('.')
21
+ netloc = parsed_url.netloc
22
+ parsed_spl = netloc.split('.')
23
+ directory_name = '.'.join(parsed_spl[:-1])
16
24
  if directory_name.startswith('www.'):
17
25
  directory_name = directory_name[len('www.'):]
18
26
  return directory_name
27
+ def get_domain_directory_from_url(url,base_dir=None):
28
+ base_dir =base_dir or os.getcwd()
29
+ domain_name = get_domain_name_from_url(url)
30
+ return make_directory(directory,domain_name)
19
31
  # Configuration
20
32
  def normalize_url(url, base_url):
21
33
  """
@@ -176,7 +188,6 @@ def test_download(url=None,directory=None):
176
188
  site_mgr = usurpManager(url,output_dir)
177
189
 
178
190
  def usurpit(url,output_dir=None,max_depth=None,wait_between_requests=None,operating_system=None, browser=None, version=None,user_agent=None,website_bot=None):
179
- output_dir= output_dir or get_directory_from_url(url) or os.path.join(os.getcwd(),'usurped')
180
- os.makedirs(output_dir,exist_ok=True)
191
+ output_dir = get_domain_name_from_url(url) or make_directory(path='usurped')
181
192
  site_mgr = usurpManager(url,output_dir=output_dir,max_depth=max_depth,wait_between_requests=wait_between_requests,operating_system=operating_system, browser=browser, version=version,user_agent=user_agent,website_bot=website_bot)
182
193
  site_mgr.main()
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: abstract_webtools
3
- Version: 0.1.6.117
3
+ Version: 0.1.6.119
4
4
  Summary: Abstract Web Tools is a Python package that provides various utility functions for web scraping tasks. It is built on top of popular libraries such as `requests`, `BeautifulSoup`, and `urllib3` to simplify the process of fetching and parsing web content.
5
5
  Home-page: https://github.com/AbstractEndeavors/abstract_essentials/tree/main/abstract_webtools
6
6
  Author: putkoff