waymore 4.0__tar.gz → 4.2__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {waymore-4.0/waymore.egg-info → waymore-4.2}/PKG-INFO +15 -3
- {waymore-4.0 → waymore-4.2}/README.md +14 -2
- waymore-4.2/waymore/__init__.py +1 -0
- {waymore-4.0 → waymore-4.2}/waymore/waymore.py +30 -23
- {waymore-4.0 → waymore-4.2/waymore.egg-info}/PKG-INFO +15 -3
- waymore-4.0/waymore/__init__.py +0 -1
- {waymore-4.0 → waymore-4.2}/LICENSE +0 -0
- {waymore-4.0 → waymore-4.2}/setup.cfg +0 -0
- {waymore-4.0 → waymore-4.2}/setup.py +0 -0
- {waymore-4.0 → waymore-4.2}/waymore.egg-info/SOURCES.txt +0 -0
- {waymore-4.0 → waymore-4.2}/waymore.egg-info/dependency_links.txt +0 -0
- {waymore-4.0 → waymore-4.2}/waymore.egg-info/entry_points.txt +0 -0
- {waymore-4.0 → waymore-4.2}/waymore.egg-info/requires.txt +0 -0
- {waymore-4.0 → waymore-4.2}/waymore.egg-info/top_level.txt +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.1
|
|
2
2
|
Name: waymore
|
|
3
|
-
Version: 4.0
|
|
3
|
+
Version: 4.2
|
|
4
4
|
Summary: Find way more from the Wayback Machine, Common Crawl, Alien Vault OTX, URLScan & VirusTotal!
|
|
5
5
|
Home-page: https://github.com/xnl-h4ck3r/waymore
|
|
6
6
|
Author: @xnl-h4ck3r
|
|
@@ -16,7 +16,7 @@ Requires-Dist: tldextract
|
|
|
16
16
|
|
|
17
17
|
<center><img src="https://github.com/xnl-h4ck3r/waymore/blob/main/waymore/images/title.png"></center>
|
|
18
18
|
|
|
19
|
-
## About - v4.0
|
|
19
|
+
## About - v4.2
|
|
20
20
|
|
|
21
21
|
The idea behind **waymore** is to find even more links from the Wayback Machine than other existing tools.
|
|
22
22
|
|
|
@@ -47,12 +47,24 @@ Now **waymore** gets URL's from ALL of those sources too (with ability to filter
|
|
|
47
47
|
|
|
48
48
|
`waymore` supports **Python 3**.
|
|
49
49
|
|
|
50
|
-
Install `waymore` in default(global) python environment.
|
|
50
|
+
Install `waymore` in default (global) python environment.
|
|
51
|
+
|
|
52
|
+
```bash
|
|
53
|
+
pip install waymore
|
|
54
|
+
```
|
|
55
|
+
|
|
56
|
+
OR
|
|
51
57
|
|
|
52
58
|
```bash
|
|
53
59
|
pip install git+https://github.com/xnl-h4ck3r/waymore.git -v
|
|
54
60
|
```
|
|
55
61
|
|
|
62
|
+
You can upgrade with
|
|
63
|
+
|
|
64
|
+
```bash
|
|
65
|
+
pip install --upgrade waymore
|
|
66
|
+
```
|
|
67
|
+
|
|
56
68
|
### pipx
|
|
57
69
|
|
|
58
70
|
Quick setup in isolated python environment using [pipx](https://pypa.github.io/pipx/)
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
<center><img src="https://github.com/xnl-h4ck3r/waymore/blob/main/waymore/images/title.png"></center>
|
|
2
2
|
|
|
3
|
-
## About - v4.0
|
|
3
|
+
## About - v4.2
|
|
4
4
|
|
|
5
5
|
The idea behind **waymore** is to find even more links from the Wayback Machine than other existing tools.
|
|
6
6
|
|
|
@@ -31,12 +31,24 @@ Now **waymore** gets URL's from ALL of those sources too (with ability to filter
|
|
|
31
31
|
|
|
32
32
|
`waymore` supports **Python 3**.
|
|
33
33
|
|
|
34
|
-
Install `waymore` in default(global) python environment.
|
|
34
|
+
Install `waymore` in default (global) python environment.
|
|
35
|
+
|
|
36
|
+
```bash
|
|
37
|
+
pip install waymore
|
|
38
|
+
```
|
|
39
|
+
|
|
40
|
+
OR
|
|
35
41
|
|
|
36
42
|
```bash
|
|
37
43
|
pip install git+https://github.com/xnl-h4ck3r/waymore.git -v
|
|
38
44
|
```
|
|
39
45
|
|
|
46
|
+
You can upgrade with
|
|
47
|
+
|
|
48
|
+
```bash
|
|
49
|
+
pip install --upgrade waymore
|
|
50
|
+
```
|
|
51
|
+
|
|
40
52
|
### pipx
|
|
41
53
|
|
|
42
54
|
Quick setup in isolated python environment using [pipx](https://pypa.github.io/pipx/)
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
__version__="4.2"
|
|
@@ -30,7 +30,6 @@ try:
|
|
|
30
30
|
from . import __version__
|
|
31
31
|
except:
|
|
32
32
|
pass
|
|
33
|
-
from tqdm import tqdm
|
|
34
33
|
|
|
35
34
|
# Try to import psutil to show memory usage
|
|
36
35
|
try:
|
|
@@ -1781,23 +1780,31 @@ def processWayBackPage(url):
|
|
|
1781
1780
|
return
|
|
1782
1781
|
|
|
1783
1782
|
# Get the URLs and MIME types. Each line is a separate JSON string
|
|
1784
|
-
|
|
1785
|
-
|
|
1786
|
-
|
|
1787
|
-
if verbose():
|
|
1788
|
-
try:
|
|
1789
|
-
linkMimes.add(str(results).split(' ')[2])
|
|
1790
|
-
except Exception as e:
|
|
1791
|
-
if verbose():
|
|
1792
|
-
writerr(colored(getSPACER('ERROR processWayBackPage 2: Cannot get MIME type from line: ' + str(line)),'red'))
|
|
1793
|
-
write(resp.text)
|
|
1794
|
-
try:
|
|
1783
|
+
try:
|
|
1784
|
+
for line in resp.iter_lines():
|
|
1785
|
+
results = line.decode("utf-8")
|
|
1795
1786
|
foundUrl = fixArchiveOrgUrl(str(results).split(' ')[1])
|
|
1796
|
-
|
|
1797
|
-
|
|
1798
|
-
|
|
1799
|
-
|
|
1800
|
-
|
|
1787
|
+
|
|
1788
|
+
# Check the URL exclusions
|
|
1789
|
+
match = re.search(r'('+re.escape(FILTER_URL).replace(',','|')+')', foundUrl, flags=re.IGNORECASE)
|
|
1790
|
+
if match is None:
|
|
1791
|
+
# Only get MIME Types if --verbose option was selected
|
|
1792
|
+
if verbose():
|
|
1793
|
+
try:
|
|
1794
|
+
linkMimes.add(str(results).split(' ')[2])
|
|
1795
|
+
except Exception as e:
|
|
1796
|
+
if verbose():
|
|
1797
|
+
writerr(colored(getSPACER('ERROR processWayBackPage 2: Cannot get MIME type from line: ' + str(line)),'red'))
|
|
1798
|
+
write(resp.text)
|
|
1799
|
+
try:
|
|
1800
|
+
linksFoundAdd(foundUrl)
|
|
1801
|
+
except Exception as e:
|
|
1802
|
+
if verbose():
|
|
1803
|
+
writerr(colored(getSPACER('ERROR processWayBackPage 3: Cannot get link from line: ' + str(line)),'red'))
|
|
1804
|
+
write(resp.text)
|
|
1805
|
+
except Exception as e:
|
|
1806
|
+
if verbose():
|
|
1807
|
+
writerr(colored(getSPACER('ERROR processWayBackPage 4: ' + str(line)),'red'))
|
|
1801
1808
|
else:
|
|
1802
1809
|
pass
|
|
1803
1810
|
except Exception as e:
|
|
@@ -2423,12 +2430,12 @@ def processResponses():
|
|
|
2423
2430
|
# This is useful for filtering out captures that are 'too dense' or when looking for unique captures."
|
|
2424
2431
|
if args.capture_interval == 'none': # get all
|
|
2425
2432
|
collapse = ''
|
|
2426
|
-
elif args.capture_interval == 'h': # get at most 1 capture per hour
|
|
2427
|
-
collapse = 'timestamp:10'
|
|
2428
|
-
elif args.capture_interval == 'd': # get at most 1 capture per day
|
|
2429
|
-
collapse = 'timestamp:8'
|
|
2430
|
-
elif args.capture_interval == 'm': # get at most 1 capture per month
|
|
2431
|
-
collapse = 'timestamp:6'
|
|
2433
|
+
elif args.capture_interval == 'h': # get at most 1 capture per URL per hour
|
|
2434
|
+
collapse = 'timestamp:10,original'
|
|
2435
|
+
elif args.capture_interval == 'd': # get at most 1 capture per URL per day
|
|
2436
|
+
collapse = 'timestamp:8,original'
|
|
2437
|
+
elif args.capture_interval == 'm': # get at most 1 capture per URL per month
|
|
2438
|
+
collapse = 'timestamp:6,original'
|
|
2432
2439
|
|
|
2433
2440
|
url = WAYBACK_URL.replace('{DOMAIN}',subs + quote(argsInput) + path).replace('{COLLAPSE}',collapse) + filterMIME + filterCode + filterLimit + filterFrom + filterTo + filterKeywords
|
|
2434
2441
|
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.1
|
|
2
2
|
Name: waymore
|
|
3
|
-
Version: 4.0
|
|
3
|
+
Version: 4.2
|
|
4
4
|
Summary: Find way more from the Wayback Machine, Common Crawl, Alien Vault OTX, URLScan & VirusTotal!
|
|
5
5
|
Home-page: https://github.com/xnl-h4ck3r/waymore
|
|
6
6
|
Author: @xnl-h4ck3r
|
|
@@ -16,7 +16,7 @@ Requires-Dist: tldextract
|
|
|
16
16
|
|
|
17
17
|
<center><img src="https://github.com/xnl-h4ck3r/waymore/blob/main/waymore/images/title.png"></center>
|
|
18
18
|
|
|
19
|
-
## About - v4.0
|
|
19
|
+
## About - v4.2
|
|
20
20
|
|
|
21
21
|
The idea behind **waymore** is to find even more links from the Wayback Machine than other existing tools.
|
|
22
22
|
|
|
@@ -47,12 +47,24 @@ Now **waymore** gets URL's from ALL of those sources too (with ability to filter
|
|
|
47
47
|
|
|
48
48
|
`waymore` supports **Python 3**.
|
|
49
49
|
|
|
50
|
-
Install `waymore` in default(global) python environment.
|
|
50
|
+
Install `waymore` in default (global) python environment.
|
|
51
|
+
|
|
52
|
+
```bash
|
|
53
|
+
pip install waymore
|
|
54
|
+
```
|
|
55
|
+
|
|
56
|
+
OR
|
|
51
57
|
|
|
52
58
|
```bash
|
|
53
59
|
pip install git+https://github.com/xnl-h4ck3r/waymore.git -v
|
|
54
60
|
```
|
|
55
61
|
|
|
62
|
+
You can upgrade with
|
|
63
|
+
|
|
64
|
+
```bash
|
|
65
|
+
pip install --upgrade waymore
|
|
66
|
+
```
|
|
67
|
+
|
|
56
68
|
### pipx
|
|
57
69
|
|
|
58
70
|
Quick setup in isolated python environment using [pipx](https://pypa.github.io/pipx/)
|
waymore-4.0/waymore/__init__.py
DELETED
|
@@ -1 +0,0 @@
|
|
|
1
|
-
__version__="4.0"
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|