waymore 4.0__tar.gz → 4.2__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: waymore
3
- Version: 4.0
3
+ Version: 4.2
4
4
  Summary: Find way more from the Wayback Machine, Common Crawl, Alien Vault OTX, URLScan & VirusTotal!
5
5
  Home-page: https://github.com/xnl-h4ck3r/waymore
6
6
  Author: @xnl-h4ck3r
@@ -16,7 +16,7 @@ Requires-Dist: tldextract
16
16
 
17
17
  <center><img src="https://github.com/xnl-h4ck3r/waymore/blob/main/waymore/images/title.png"></center>
18
18
 
19
- ## About - v4.0
19
+ ## About - v4.2
20
20
 
21
21
  The idea behind **waymore** is to find even more links from the Wayback Machine than other existing tools.
22
22
 
@@ -47,12 +47,24 @@ Now **waymore** gets URL's from ALL of those sources too (with ability to filter
47
47
 
48
48
  `waymore` supports **Python 3**.
49
49
 
50
- Install `waymore` in default(global) python environment.
50
+ Install `waymore` in default (global) python environment.
51
+
52
+ ```bash
53
+ pip install waymore
54
+ ```
55
+
56
+ OR
51
57
 
52
58
  ```bash
53
59
  pip install git+https://github.com/xnl-h4ck3r/waymore.git -v
54
60
  ```
55
61
 
62
+ You can upgrade with
63
+
64
+ ```bash
65
+ pip install --upgrade waymore
66
+ ```
67
+
56
68
  ### pipx
57
69
 
58
70
  Quick setup in isolated python environment using [pipx](https://pypa.github.io/pipx/)
@@ -1,6 +1,6 @@
1
1
  <center><img src="https://github.com/xnl-h4ck3r/waymore/blob/main/waymore/images/title.png"></center>
2
2
 
3
- ## About - v4.0
3
+ ## About - v4.2
4
4
 
5
5
  The idea behind **waymore** is to find even more links from the Wayback Machine than other existing tools.
6
6
 
@@ -31,12 +31,24 @@ Now **waymore** gets URL's from ALL of those sources too (with ability to filter
31
31
 
32
32
  `waymore` supports **Python 3**.
33
33
 
34
- Install `waymore` in default(global) python environment.
34
+ Install `waymore` in default (global) python environment.
35
+
36
+ ```bash
37
+ pip install waymore
38
+ ```
39
+
40
+ OR
35
41
 
36
42
  ```bash
37
43
  pip install git+https://github.com/xnl-h4ck3r/waymore.git -v
38
44
  ```
39
45
 
46
+ You can upgrade with
47
+
48
+ ```bash
49
+ pip install --upgrade waymore
50
+ ```
51
+
40
52
  ### pipx
41
53
 
42
54
  Quick setup in isolated python environment using [pipx](https://pypa.github.io/pipx/)
@@ -0,0 +1 @@
1
+ __version__="4.2"
@@ -30,7 +30,6 @@ try:
30
30
  from . import __version__
31
31
  except:
32
32
  pass
33
- from tqdm import tqdm
34
33
 
35
34
  # Try to import psutil to show memory usage
36
35
  try:
@@ -1781,23 +1780,31 @@ def processWayBackPage(url):
1781
1780
  return
1782
1781
 
1783
1782
  # Get the URLs and MIME types. Each line is a separate JSON string
1784
- for line in resp.iter_lines():
1785
- results = line.decode("utf-8")
1786
- # Only get MIME Types if --verbose option was selected
1787
- if verbose():
1788
- try:
1789
- linkMimes.add(str(results).split(' ')[2])
1790
- except Exception as e:
1791
- if verbose():
1792
- writerr(colored(getSPACER('ERROR processWayBackPage 2: Cannot get MIME type from line: ' + str(line)),'red'))
1793
- write(resp.text)
1794
- try:
1783
+ try:
1784
+ for line in resp.iter_lines():
1785
+ results = line.decode("utf-8")
1795
1786
  foundUrl = fixArchiveOrgUrl(str(results).split(' ')[1])
1796
- linksFoundAdd(foundUrl)
1797
- except Exception as e:
1798
- if verbose():
1799
- writerr(colored(getSPACER('ERROR processWayBackPage 3: Cannot get link from line: ' + str(line)),'red'))
1800
- write(resp.text)
1787
+
1788
+ # Check the URL exclusions
1789
+ match = re.search(r'('+re.escape(FILTER_URL).replace(',','|')+')', foundUrl, flags=re.IGNORECASE)
1790
+ if match is None:
1791
+ # Only get MIME Types if --verbose option was selected
1792
+ if verbose():
1793
+ try:
1794
+ linkMimes.add(str(results).split(' ')[2])
1795
+ except Exception as e:
1796
+ if verbose():
1797
+ writerr(colored(getSPACER('ERROR processWayBackPage 2: Cannot get MIME type from line: ' + str(line)),'red'))
1798
+ write(resp.text)
1799
+ try:
1800
+ linksFoundAdd(foundUrl)
1801
+ except Exception as e:
1802
+ if verbose():
1803
+ writerr(colored(getSPACER('ERROR processWayBackPage 3: Cannot get link from line: ' + str(line)),'red'))
1804
+ write(resp.text)
1805
+ except Exception as e:
1806
+ if verbose():
1807
+ writerr(colored(getSPACER('ERROR processWayBackPage 4: ' + str(line)),'red'))
1801
1808
  else:
1802
1809
  pass
1803
1810
  except Exception as e:
@@ -2423,12 +2430,12 @@ def processResponses():
2423
2430
  # This is useful for filtering out captures that are 'too dense' or when looking for unique captures."
2424
2431
  if args.capture_interval == 'none': # get all
2425
2432
  collapse = ''
2426
- elif args.capture_interval == 'h': # get at most 1 capture per hour
2427
- collapse = 'timestamp:10'
2428
- elif args.capture_interval == 'd': # get at most 1 capture per day
2429
- collapse = 'timestamp:8'
2430
- elif args.capture_interval == 'm': # get at most 1 capture per month
2431
- collapse = 'timestamp:6'
2433
+ elif args.capture_interval == 'h': # get at most 1 capture per URL per hour
2434
+ collapse = 'timestamp:10,original'
2435
+ elif args.capture_interval == 'd': # get at most 1 capture per URL per day
2436
+ collapse = 'timestamp:8,original'
2437
+ elif args.capture_interval == 'm': # get at most 1 capture per URL per month
2438
+ collapse = 'timestamp:6,original'
2432
2439
 
2433
2440
  url = WAYBACK_URL.replace('{DOMAIN}',subs + quote(argsInput) + path).replace('{COLLAPSE}',collapse) + filterMIME + filterCode + filterLimit + filterFrom + filterTo + filterKeywords
2434
2441
 
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: waymore
3
- Version: 4.0
3
+ Version: 4.2
4
4
  Summary: Find way more from the Wayback Machine, Common Crawl, Alien Vault OTX, URLScan & VirusTotal!
5
5
  Home-page: https://github.com/xnl-h4ck3r/waymore
6
6
  Author: @xnl-h4ck3r
@@ -16,7 +16,7 @@ Requires-Dist: tldextract
16
16
 
17
17
  <center><img src="https://github.com/xnl-h4ck3r/waymore/blob/main/waymore/images/title.png"></center>
18
18
 
19
- ## About - v4.0
19
+ ## About - v4.2
20
20
 
21
21
  The idea behind **waymore** is to find even more links from the Wayback Machine than other existing tools.
22
22
 
@@ -47,12 +47,24 @@ Now **waymore** gets URL's from ALL of those sources too (with ability to filter
47
47
 
48
48
  `waymore` supports **Python 3**.
49
49
 
50
- Install `waymore` in default(global) python environment.
50
+ Install `waymore` in default (global) python environment.
51
+
52
+ ```bash
53
+ pip install waymore
54
+ ```
55
+
56
+ OR
51
57
 
52
58
  ```bash
53
59
  pip install git+https://github.com/xnl-h4ck3r/waymore.git -v
54
60
  ```
55
61
 
62
+ You can upgrade with
63
+
64
+ ```bash
65
+ pip install --upgrade waymore
66
+ ```
67
+
56
68
  ### pipx
57
69
 
58
70
  Quick setup in isolated python environment using [pipx](https://pypa.github.io/pipx/)
@@ -1 +0,0 @@
1
- __version__="4.0"
File without changes
File without changes
File without changes