bbot 2.4.2.6596rc0__py3-none-any.whl → 2.4.2.6608rc0__py3-none-any.whl

This diff shows the changes between two publicly available versions of a package that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Potentially problematic release.


This version of bbot might be problematic. Click here for more details.

bbot/__init__.py CHANGED
@@ -1,5 +1,5 @@
1
1
  # version placeholder (replaced by poetry-dynamic-versioning)
2
- __version__ = "v2.4.2.6596rc"
2
+ __version__ = "v2.4.2.6608rc"
3
3
 
4
4
  from .scanner import Scanner, Preset
5
5
 
@@ -5,7 +5,7 @@ import time
5
5
  import inspect
6
6
  import regex as re
7
7
  from pathlib import Path
8
- from bbot.errors import ExcavateError
8
+ from bbot.errors import ExcavateError, ValidationError
9
9
  import bbot.core.helpers.regexes as bbot_regexes
10
10
  from bbot.modules.base import BaseInterceptModule
11
11
  from bbot.modules.internal.base import BaseInternalModule
@@ -622,14 +622,15 @@ class excavate(BaseInternalModule, BaseInterceptModule):
622
622
  base_url += f"?{event.parsed_url.query}"
623
623
  url = urljoin(base_url, endpoint)
624
624
 
625
+ try:
626
+ # Validate the URL before using it
627
+ parsed_url = self.excavate.helpers.validators.validate_url_parsed(url)
628
+ except (ValidationError, ValueError) as e:
629
+ self.excavate.debug(f"Invalid URL [{url}]: {e}")
630
+ continue
631
+
625
632
  if self.excavate.helpers.validate_parameter(parameter_name, parameter_type):
626
633
  if self.excavate.in_bl(parameter_name) is False:
627
- parsed_url = urlparse(url)
628
- if not parsed_url.hostname:
629
- self.excavate.warning(
630
- f"Error Parsing reconstructed URL [{url}] during parameter extraction, missing hostname"
631
- )
632
- continue
633
634
  description = f"HTTP Extracted Parameter [{parameter_name}] ({parameterExtractorSubModule.name} Submodule)"
634
635
  data = {
635
636
  "host": parsed_url.hostname,
@@ -848,45 +849,51 @@ class excavate(BaseInternalModule, BaseInterceptModule):
848
849
  urls_found = 0
849
850
  final_url = ""
850
851
  for url_str in results:
851
- if identifier == "url_full":
852
- if not await self.helpers.re.search(self.full_url_regex, url_str):
852
+ try:
853
+ if identifier == "url_full":
854
+ if not await self.helpers.re.search(self.full_url_regex, url_str):
855
+ self.excavate.debug(
856
+ f"Rejecting potential full URL [{url_str}] as did not match full_url_regex"
857
+ )
858
+ continue
859
+ final_url = url_str
860
+ self.excavate.debug(f"Discovered Full URL [{final_url}]")
861
+
862
+ elif identifier == "url_attr" and hasattr(event, "parsed_url"):
863
+ m = await self.helpers.re.search(self.tag_attribute_regex, url_str)
864
+ if not m:
865
+ self.excavate.debug(
866
+ f"Rejecting potential attribute URL [{url_str}] as did not match tag_attribute_regex"
867
+ )
868
+ continue
869
+ unescaped_url = html.unescape(m.group(1))
870
+ source_url = event.parsed_url.geturl()
871
+ final_url = urldefrag(urljoin(source_url, unescaped_url)).url
872
+ if not await self.helpers.re.search(self.full_url_regex_strict, final_url):
873
+ self.excavate.debug(
874
+ f"Rejecting reconstructed URL [{final_url}] as did not match full_url_regex_strict"
875
+ )
876
+ continue
853
877
  self.excavate.debug(
854
- f"Rejecting potential full URL [{url_str}] as did not match full_url_regex"
878
+ f"Reconstructed Full URL [{final_url}] from extracted relative URL [{unescaped_url}] "
855
879
  )
856
- continue
857
- final_url = url_str
858
880
 
859
- self.excavate.debug(f"Discovered Full URL [{final_url}]")
860
- elif identifier == "url_attr" and hasattr(event, "parsed_url"):
861
- m = await self.helpers.re.search(self.tag_attribute_regex, url_str)
862
- if not m:
863
- self.excavate.debug(
864
- f"Rejecting potential attribute URL [{url_str}] as did not match tag_attribute_regex"
881
+ if final_url:
882
+ # Validate the URL before using it
883
+ self.excavate.helpers.validators.validate_url_parsed(final_url)
884
+ if self.excavate.scan.in_scope(final_url):
885
+ urls_found += 1
886
+ await self.report(
887
+ final_url,
888
+ event,
889
+ yara_rule_settings,
890
+ discovery_context,
891
+ event_type="URL_UNVERIFIED",
892
+ urls_found=urls_found,
865
893
  )
866
- continue
867
- unescaped_url = html.unescape(m.group(1))
868
- source_url = event.parsed_url.geturl()
869
- final_url = urldefrag(urljoin(source_url, unescaped_url)).url
870
- if not await self.helpers.re.search(self.full_url_regex_strict, final_url):
871
- self.excavate.debug(
872
- f"Rejecting reconstructed URL [{final_url}] as did not match full_url_regex_strict"
873
- )
874
- continue
875
- self.excavate.debug(
876
- f"Reconstructed Full URL [{final_url}] from extracted relative URL [{unescaped_url}] "
877
- )
878
-
879
- if final_url:
880
- if self.excavate.scan.in_scope(final_url):
881
- urls_found += 1
882
- await self.report(
883
- final_url,
884
- event,
885
- yara_rule_settings,
886
- discovery_context,
887
- event_type="URL_UNVERIFIED",
888
- urls_found=urls_found,
889
- )
894
+ except (ValidationError, ValueError) as e:
895
+ self.excavate.debug(f"Invalid URL [{url_str if not final_url else final_url}]: {e}")
896
+ continue
890
897
 
891
898
  async def report_prep(self, event_data, event_type, event, tags, **kwargs):
892
899
  event_draft = self.excavate.make_event(event_data, event_type, parent=event)
@@ -1114,7 +1121,10 @@ class excavate(BaseInternalModule, BaseInterceptModule):
1114
1121
 
1115
1122
  # Check if rule processing function exists
1116
1123
  if rule_name in self.yara_preprocess_dict:
1117
- await self.yara_preprocess_dict[rule_name](result, event, discovery_context)
1124
+ try:
1125
+ await self.yara_preprocess_dict[rule_name](result, event, discovery_context)
1126
+ except ValidationError as e:
1127
+ self.debug(f"ValidationError in rule {rule_name} for result {result}: {e}")
1118
1128
  else:
1119
1129
  self.hugewarning(f"YARA Rule {rule_name} not found in pre-compiled rules")
1120
1130
 
@@ -22,7 +22,7 @@ class serial(BaseLightfuzz):
22
22
  CONTROL_PAYLOAD_PHP_RAW = "z:0:{}"
23
23
 
24
24
  BASE64_SERIALIZATION_PAYLOADS = {
25
- "php_base64": "YTowOnt9",
25
+ "php_base64": "YToxOntpOjA7aToxO30=",
26
26
  "java_base64": "rO0ABXNyABFqYXZhLmxhbmcuQm9vbGVhbs0gcoDVnPruAgABWgAFdmFsdWV4cAA=",
27
27
  "java_base64_string_error": "rO0ABXQABHRlc3Q=",
28
28
  "java_base64_OptionalDataException": "rO0ABXcEAAAAAAEAAAABc3IAEGphdmEudXRpbC5IYXNoTWFwAAAAAAAAAAECAAJMAARrZXkxYgABAAAAAAAAAAJ4cHcBAAAAB3QABHRlc3Q=",
@@ -1418,3 +1418,17 @@ class TestExcavateBadURLs(ModuleTestBase):
1418
1418
 
1419
1419
  url_events = [e for e in events if e.type == "URL_UNVERIFIED"]
1420
1420
  assert sorted([e.data for e in url_events]) == sorted(["https://ssl/", "http://127.0.0.1:8888/"])
1421
+
1422
+
1423
+ class TestExcavateURL_InvalidPort(TestExcavate):
1424
+ modules_overrides = ["excavate", "httpx", "hunt"]
1425
+
1426
+ async def setup_before_prep(self, module_test):
1427
+ # Test URL with invalid port (greater than 65535)
1428
+ module_test.httpserver.expect_request("/").respond_with_data(
1429
+ '<div><img loading="lazy" src="https://asdffoo.test.notreal:9212952841/whatever.jpg" width="576" height="382" alt="...." /></div>'
1430
+ )
1431
+
1432
+ def check(self, module_test, events):
1433
+ # Verify we got the hostname
1434
+ assert any(e.data == "asdffoo.test.notreal" for e in events)
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: bbot
3
- Version: 2.4.2.6596rc0
3
+ Version: 2.4.2.6608rc0
4
4
  Summary: OSINT automation for hackers.
5
5
  License: GPL-3.0
6
6
  Keywords: python,cli,automation,osint,threat-intel,intelligence,neo4j,scanner,python-library,hacking,recursion,pentesting,recon,command-line-tool,bugbounty,subdomains,security-tools,subdomain-scanner,osint-framework,attack-surface,subdomain-enumeration,osint-tool
@@ -1,4 +1,4 @@
1
- bbot/__init__.py,sha256=f_lWfZIjwByTjeR_K-ytNiRjidI-4UQrBdUUWh9BFdk,163
1
+ bbot/__init__.py,sha256=f4ki_KyS_oJVQYdFblwwJ7F8FE7Xj0I-rDoOOdUzd9E,163
2
2
  bbot/cli.py,sha256=1QJbANVw9Q3GFM92H2QRV2ds5756ulm08CDZwzwPpeI,11888
3
3
  bbot/core/__init__.py,sha256=l255GJE_DvUnWvrRb0J5lG-iMztJ8zVvoweDOfegGtI,46
4
4
  bbot/core/config/__init__.py,sha256=zYNw2Me6tsEr8hOOkLb4BQ97GB7Kis2k--G81S8vofU,342
@@ -124,7 +124,7 @@ bbot/modules/internal/aggregate.py,sha256=HnnfTX2GYsOz8IFtfrRX1uXV6rvFx4uG9lmYJF
124
124
  bbot/modules/internal/base.py,sha256=BXO4Hc7XKaAOaLzolF3krJX1KibPxtek2GTQUgnCHk0,387
125
125
  bbot/modules/internal/cloudcheck.py,sha256=ay6MvZFbDvdhAlFPe_kEITM4wRsfRgQJf1DLBTcZ2jM,5138
126
126
  bbot/modules/internal/dnsresolve.py,sha256=1fwWChIGpSEIIkswueiIhEwIahQ7YngZ-njFK-RIsfU,15679
127
- bbot/modules/internal/excavate.py,sha256=dftFDjAJP8b0uiSQ-Y7oI3yVwZo3gPKWQlU3X2Db1Hk,63017
127
+ bbot/modules/internal/excavate.py,sha256=L8tGdfdvxrvfskC1Ms9UtSy-gxudnQcW7Iv5tHNAbW4,63728
128
128
  bbot/modules/internal/speculate.py,sha256=ua35Da-f0-fnK0oXtx4DeGJAT19bfqnmLfetSUfJnIk,9262
129
129
  bbot/modules/internal/unarchive.py,sha256=sA6KYQnhkyHq0mHwhRESHy9wkaRE43PjPkShWW0mOvM,3763
130
130
  bbot/modules/ip2location.py,sha256=yGivX9fzvwvLpnqmYCP2a8SPjTarzrZxfRluog-nkME,2628
@@ -139,7 +139,7 @@ bbot/modules/lightfuzz/submodules/cmdi.py,sha256=-9pL7Yh7VVCObxuS6Qu2cKEJBstfk0o
139
139
  bbot/modules/lightfuzz/submodules/crypto.py,sha256=mLWsMbcox9oruNjfdOaLmT7ePMH15K8JN9K5AIB8f8o,22560
140
140
  bbot/modules/lightfuzz/submodules/nosqli.py,sha256=K0TlBtpfeBH72q01a3TCQnt9OsznA9kfRYVTe7Vmers,9399
141
141
  bbot/modules/lightfuzz/submodules/path.py,sha256=cvfna9P5Cicmc3p3BrzlY0PG1slcvJkeMzZu4i2nwO0,7744
142
- bbot/modules/lightfuzz/submodules/serial.py,sha256=UgITHbo6p7FYb6bfAJ09xBKFj1tT-vIhRSftmcyyJH8,8516
142
+ bbot/modules/lightfuzz/submodules/serial.py,sha256=i3TdGV7M0G5thn1SFyKrod9nrm9UPV8kN3sd2-tvmEc,8528
143
143
  bbot/modules/lightfuzz/submodules/sqli.py,sha256=42TTB3UglMqnlxl7p2lUx14GWjbY9b6X7K9jWB5Mf9I,8486
144
144
  bbot/modules/lightfuzz/submodules/ssti.py,sha256=Pib49rXFuf567msnlec-A1Tnvolw4aILjqn7INLWQTY,1413
145
145
  bbot/modules/lightfuzz/submodules/xss.py,sha256=VP15TBeRjglIRjLvwmHJaOCNQOWS7R4WVAZ-VRNe198,9503
@@ -347,7 +347,7 @@ bbot/test/test_step_2/module_tests/test_module_dockerhub.py,sha256=9T8CFcFP32MOp
347
347
  bbot/test/test_step_2/module_tests/test_module_dotnetnuke.py,sha256=Q7M3hrbEwOuORZXPS-pIGFTRzB2-g4cEvGtsEcTp7t8,8049
348
348
  bbot/test/test_step_2/module_tests/test_module_emailformat.py,sha256=cKxBPnEQ4AiRKV_-hSYEE6756ypst3hi6MN0L5RTukY,461
349
349
  bbot/test/test_step_2/module_tests/test_module_emails.py,sha256=bZjtO8N3GG2_g6SUEYprAFLcsi7SlwNPJJ0nODfrWYU,944
350
- bbot/test/test_step_2/module_tests/test_module_excavate.py,sha256=loR5vmpmlJcO80bDX57uZumJh8qCZWqHe7GBA4b-p1w,60748
350
+ bbot/test/test_step_2/module_tests/test_module_excavate.py,sha256=hoVQnZYb_tI1FlxXRsPaGhk1qj8hyu1GgBEb7ByE3Q0,61336
351
351
  bbot/test/test_step_2/module_tests/test_module_extractous.py,sha256=PuTE5rkEIFPwU9lhCYpTgNSkrVjcXm8PClbfOkfRS84,17973
352
352
  bbot/test/test_step_2/module_tests/test_module_ffuf.py,sha256=z8ihAM1WYss7QGXIjbi67cekg8iOemDjaM8YR9_qSEs,4100
353
353
  bbot/test/test_step_2/module_tests/test_module_ffuf_shortnames.py,sha256=0-a9J-gq8bUtmxl_-QPVidwZ9KkCvgvoG30Ot3a8lqM,8406
@@ -450,8 +450,8 @@ bbot/wordlists/raft-small-extensions-lowercase_CLEANED.txt,sha256=ZSIVebs7ptMvHx
450
450
  bbot/wordlists/top_open_ports_nmap.txt,sha256=LmdFYkfapSxn1pVuQC2LkOIY2hMLgG-Xts7DVtYzweM,42727
451
451
  bbot/wordlists/valid_url_schemes.txt,sha256=0B_VAr9Dv7aYhwi6JSBDU-3M76vNtzN0qEC_RNLo7HE,3310
452
452
  bbot/wordlists/wordninja_dns.txt.gz,sha256=DYHvvfW0TvzrVwyprqODAk4tGOxv5ezNmCPSdPuDUnQ,570241
453
- bbot-2.4.2.6596rc0.dist-info/LICENSE,sha256=GzeCzK17hhQQDNow0_r0L8OfLpeTKQjFQwBQU7ZUymg,32473
454
- bbot-2.4.2.6596rc0.dist-info/METADATA,sha256=OsjFtdUM6w_FKP6FlYNmAhgYlnQTc8bOKqvOOYv4HfE,18308
455
- bbot-2.4.2.6596rc0.dist-info/WHEEL,sha256=fGIA9gx4Qxk2KDKeNJCbOEwSrmLtjWCwzBz351GyrPQ,88
456
- bbot-2.4.2.6596rc0.dist-info/entry_points.txt,sha256=cWjvcU_lLrzzJgjcjF7yeGuRA_eDS8pQ-kmPUAyOBfo,38
457
- bbot-2.4.2.6596rc0.dist-info/RECORD,,
453
+ bbot-2.4.2.6608rc0.dist-info/LICENSE,sha256=GzeCzK17hhQQDNow0_r0L8OfLpeTKQjFQwBQU7ZUymg,32473
454
+ bbot-2.4.2.6608rc0.dist-info/METADATA,sha256=ZB2AKLHmK3TscBywNyHDAqDpd25QDc90iPu5X_NDksI,18308
455
+ bbot-2.4.2.6608rc0.dist-info/WHEEL,sha256=fGIA9gx4Qxk2KDKeNJCbOEwSrmLtjWCwzBz351GyrPQ,88
456
+ bbot-2.4.2.6608rc0.dist-info/entry_points.txt,sha256=cWjvcU_lLrzzJgjcjF7yeGuRA_eDS8pQ-kmPUAyOBfo,38
457
+ bbot-2.4.2.6608rc0.dist-info/RECORD,,