PyPI - loghunter-cli - Versions diffs - 0.1.0.dev0__py3-none-any.whl - Mend

loghunter-cli 0.1.0.dev0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (122) hide show

loghunter/__init__.py +3 -0
loghunter/cli.py +1108 -0
loghunter/cli_init.py +567 -0
loghunter/common/__init__.py +1 -0
loghunter/common/allowlist.py +436 -0
loghunter/common/clustering.py +326 -0
loghunter/common/config.py +221 -0
loghunter/common/display.py +323 -0
loghunter/common/errors.py +45 -0
loghunter/common/finding.py +239 -0
loghunter/common/loader/__init__.py +136 -0
loghunter/common/loader/diagnostics.py +94 -0
loghunter/common/loader/discovery.py +335 -0
loghunter/common/loader/io.py +76 -0
loghunter/common/loader/pipeline.py +1010 -0
loghunter/common/loader/sniff.py +184 -0
loghunter/common/loader/types.py +207 -0
loghunter/common/loader/windowing.py +523 -0
loghunter/common/output.py +93 -0
loghunter/common/paths.py +105 -0
loghunter/common/sources.py +392 -0
loghunter/data/allowlist/connections.txt +50 -0
loghunter/data/allowlist/domains_devices.txt +5 -0
loghunter/data/allowlist/domains_homelab.txt +5 -0
loghunter/data/allowlist/domains_universal.txt +125 -0
loghunter/data/config_example.toml +144 -0
loghunter/detectors/__init__.py +5 -0
loghunter/detectors/auth.py +27 -0
loghunter/detectors/aws.py +671 -0
loghunter/detectors/beacon.py +258 -0
loghunter/detectors/dns.py +778 -0
loghunter/detectors/dnsblock.py +29 -0
loghunter/detectors/duration.py +178 -0
loghunter/detectors/protocol.py +26 -0
loghunter/detectors/scan.py +735 -0
loghunter/detectors/ssl.py +25 -0
loghunter/detectors/syslog.py +266 -0
loghunter/detectors/weird.py +27 -0
loghunter/digest/__init__.py +43 -0
loghunter/digest/_stats.py +182 -0
loghunter/digest/blob.py +698 -0
loghunter/digest/cloudtrail.py +341 -0
loghunter/digest/conn.py +367 -0
loghunter/digest/dns.py +364 -0
loghunter/digest/syslog.py +269 -0
loghunter/exporters/__init__.py +534 -0
loghunter/exporters/cloudtrail.py +499 -0
loghunter/exporters/splunk.py +222 -0
loghunter/outputs/__init__.py +1 -0
loghunter/outputs/allowlist.py +75 -0
loghunter/outputs/csv.py +70 -0
loghunter/outputs/email.py +44 -0
loghunter/outputs/html.py +99 -0
loghunter/outputs/json.py +77 -0
loghunter/outputs/text.py +1422 -0
loghunter/parsers/__init__.py +1 -0
loghunter/parsers/cloudtrail.py +287 -0
loghunter/parsers/dnsmasq.py +331 -0
loghunter/parsers/syslog.py +150 -0
loghunter/parsers/zeek.py +294 -0
loghunter/parsers/zeek_tsv.py +310 -0
loghunter/runner.py +1895 -0
loghunter_cli-0.1.0.dev0.dist-info/METADATA +336 -0
loghunter_cli-0.1.0.dev0.dist-info/RECORD +122 -0
loghunter_cli-0.1.0.dev0.dist-info/WHEEL +5 -0
loghunter_cli-0.1.0.dev0.dist-info/entry_points.txt +2 -0
loghunter_cli-0.1.0.dev0.dist-info/licenses/LICENSE +21 -0
loghunter_cli-0.1.0.dev0.dist-info/top_level.txt +4 -0
migrations/cloudtrail_parquet.py +59 -0
migrations/conn_fft.py +550 -0
migrations/conn_scan.py +1097 -0
migrations/dns_dbscan.py +520 -0
migrations/get_syslog.py +402 -0
migrations/syslog_drain3.py +479 -0
scratch/junk/parquet.py +59 -0
tests/__init__.py +1 -0
tests/_cloudtrail_fakes.py +116 -0
tests/conftest.py +17 -0
tests/test_allowlist_defaults_accessor.py +90 -0
tests/test_architecture_spine.py +302 -0
tests/test_aws_detector.py +504 -0
tests/test_be_like_water.py +106 -0
tests/test_cli_help.py +342 -0
tests/test_cli_multi_positional.py +458 -0
tests/test_cloudtrail_exporter.py +631 -0
tests/test_cloudtrail_exporter_botocore.py +207 -0
tests/test_cloudtrail_parser.py +393 -0
tests/test_clustering.py +85 -0
tests/test_clustering_interruptible.py +404 -0
tests/test_config_cli.py +1006 -0
tests/test_config_example_drift.py +164 -0
tests/test_digest_blob.py +1237 -0
tests/test_digest_cli.py +1040 -0
tests/test_digest_cloudtrail.py +980 -0
tests/test_digest_conn.py +1189 -0
tests/test_digest_dns.py +770 -0
tests/test_digest_stats.py +282 -0
tests/test_digest_syslog.py +724 -0
tests/test_display.py +370 -0
tests/test_dns_detector.py +1010 -0
tests/test_dnsmasq_parser.py +467 -0
tests/test_duration_detector.py +491 -0
tests/test_export_orchestrator_shape.py +153 -0
tests/test_init_wizard.py +707 -0
tests/test_loader.py +3639 -0
tests/test_loader_package_surface.py +115 -0
tests/test_loader_window_model.py +215 -0
tests/test_output_path_cascade.py +575 -0
tests/test_resolve_path.py +111 -0
tests/test_root_provenance.py +212 -0
tests/test_runner.py +2599 -0
tests/test_scan_detector.py +455 -0
tests/test_search_paths.py +50 -0
tests/test_sniff_orchestrator.py +373 -0
tests/test_sniff_recognizers.py +573 -0
tests/test_source_resolution_seam.py +471 -0
tests/test_sources.py +648 -0
tests/test_splunk_exporter.py +351 -0
tests/test_syslog_detector.py +458 -0
tests/test_syslog_parser.py +582 -0
tests/test_text_output.py +1225 -0
tests/test_zeek_tsv_parser.py +580 -0

tests/test_cli_help.py ADDED Viewed

@@ -0,0 +1,342 @@
+"""Per-command help, side-effect-light help short-circuit, and a few other
+parser-surface invariants that don't fit the verb-specific suites.
+Key promises locked here:
+  - ``loghunter <verb> --help`` / ``-h`` renders that verb's own generated help.
+  - Help fires BEFORE config load, output-registry lookup, sniff dispatch, or
+    init wizard entry.
+  - ``--help=anything`` and ``-h=anything`` are NOT help — they raise the
+    strict-parser "takes no value" error.
+  - ``loghunter conn.log`` (a real file in CWD) resolves as a path, not as an
+    unknown command.
+  - ``--output=FORMAT`` validates via the registered output handler list.
+"""
+from __future__ import annotations
+import sys
+from pathlib import Path
+import pytest
+from loghunter import cli
+from loghunter.common import config as cfg
+# ── per-command help renders from the spec ───────────────────────────────────
+def _help_mentions_flag(rendered: str, flag: str) -> bool:
+    """Return True when *flag* occurs in *rendered* as a standalone token.
+    A plain substring test is too loose for flag spellings: ``-h`` is a
+    substring of ``--help`` and ``--out`` is a substring of ``--output``.
+    The lookarounds reject any match glued to a word character or a dash."""
+    import re  # local import: keeps this helper self-contained
+    pattern = rf"(?<![\w-]){re.escape(flag)}(?![\w-])"
+    return re.search(pattern, rendered) is not None
+@pytest.mark.parametrize("verb", [
+    "", "beacon", "dns", "syslog", "scan", "duration", "aws",
+    "digest", "export", "init",
+])
+def test_render_verb_help_lists_verb_allowed_flags(verb: str) -> None:
+    """Every flag in a verb's allowed set appears in its rendered help (long
+    spelling, plus the short spelling when the spec defines one), and no flag
+    from outside the allowed set leaks in.
+    Flags are matched as whole tokens so a short flag cannot be satisfied by
+    the long flag that starts with the same letter, and a disallowed flag is
+    not reported as leaked merely because it prefixes an allowed one."""
+    rendered = cli._render_verb_help(verb)
+    allowed = cli._VERBS[verb].allowed
+    for spec in cli._FLAG_LIST:
+        if spec.key not in allowed:
+            assert not _help_mentions_flag(rendered, spec.long), (
+                f"{spec.long} should NOT be in {verb!r} help"
+            )
+            continue
+        assert _help_mentions_flag(rendered, spec.long), (
+            f"{spec.long} should be in {verb!r} help"
+        )
+        if spec.short:
+            assert _help_mentions_flag(rendered, f"-{spec.short}"), (
+                f"-{spec.short} should be in {verb!r} help"
+            )
+def test_render_verb_help_blob_path_never_appears() -> None:
+    """No verb's rendered help may mention ``blob_path`` in any spelling.
+    ``blob_path`` is an INTERNAL routing key; listing it in the spec or an
+    allowed set would silently mint an unadvertised ``--blob-path``
+    ([[feedback-cli-surface-discipline]])."""
+    forbidden_spellings = ("blob_path", "--blob-path", "-blob-path")
+    for verb in cli._VERBS:
+        help_text = cli._render_verb_help(verb)
+        for spelling in forbidden_spellings:
+            assert spelling not in help_text
+def test_init_help_only_lists_help(capsys: pytest.CaptureFixture[str]) -> None:
+    """The help rendered for ``init`` contains ``--help`` and the long
+    spelling of no other flag in the spec (init's allowed set is ``{help}``)."""
+    help_text = cli._render_verb_help("init")
+    assert "--help" in help_text
+    other_long_flags = (
+        spec.long for spec in cli._FLAG_LIST if spec.key != "help"
+    )
+    for long_flag in other_long_flags:
+        assert long_flag not in help_text
+# ── side-effect-light help: no config load, no sniff, no wizard ──────────────
+def test_verb_help_does_not_load_config(
+    monkeypatch: pytest.MonkeyPatch,
+    capsys: pytest.CaptureFixture[str],
+) -> None:
+    """``<verb> --help`` short-circuits BEFORE cfg.load is called.
+    ``cfg.load`` is replaced with a function that raises, so any help
+    invocation that reaches config loading blows up instead of returning 0.
+    Each assertion names the argv under test so a failure in this loop
+    identifies the offending invocation."""
+    def _exploding_load(_path=None):  # pragma: no cover — would only run on failure
+        raise RuntimeError("config must not load during help")
+    monkeypatch.setattr(cfg, "load", _exploding_load)
+    help_invocations = (
+        ["beacon", "--help"], ["beacon", "-h"],
+        ["digest", "--help"], ["digest", "-h"],
+        ["export", "--help"], ["init", "--help"],
+        ["--help"], ["-h"],
+    )
+    for argv in help_invocations:
+        rc = cli._main(argv)
+        assert rc == 0, f"{argv!r} should return 0 from the help short-circuit"
+        # Drain captured output so one invocation's help never bleeds into the next.
+        capsys.readouterr()
+def test_init_help_does_not_start_wizard(
+    monkeypatch: pytest.MonkeyPatch,
+    capsys: pytest.CaptureFixture[str],
+) -> None:
+    """``init -h`` prints init's usage and returns 0 without ever calling
+    ``loghunter.cli_init.run_init`` (the wizard entry point)."""
+    wizard_calls: list[bool] = []
+    def _spy_run_init():  # pragma: no cover — would only run on failure
+        wizard_calls.append(True)
+    monkeypatch.setattr("loghunter.cli_init.run_init", _spy_run_init)
+    exit_code = cli._main(["init", "-h"])
+    assert exit_code == 0
+    assert not wizard_calls
+    stdout = capsys.readouterr().out
+    assert "Usage: loghunter init" in stdout
+def test_digest_help_does_not_sniff(
+    monkeypatch: pytest.MonkeyPatch,
+    capsys: pytest.CaptureFixture[str],
+    tmp_path: Path,
+) -> None:
+    """``digest <path> --help`` returns 0 without calling
+    ``sniff_format_detailed``, even though a real positional file is given."""
+    sniff_calls: list[object] = []
+    def _spy_sniff(_path):  # pragma: no cover — would only run on failure
+        sniff_calls.append(_path)
+        raise RuntimeError("sniff must not run during help")
+    monkeypatch.setattr(
+        "loghunter.common.loader.sniff_format_detailed", _spy_sniff,
+    )
+    # The positional must exist on disk so only the help short-circuit can
+    # explain why it is never sniffed.
+    existing_log = tmp_path / "anything.log"
+    existing_log.write_text("placeholder\n", encoding="utf-8")
+    exit_code = cli._main(["digest", str(existing_log), "--help"])
+    assert exit_code == 0
+    assert not sniff_calls
+def test_help_with_output_bogus_short_circuits_before_registry(
+    monkeypatch: pytest.MonkeyPatch,
+    capsys: pytest.CaptureFixture[str],
+) -> None:
+    """``beacon --help --output=bogus`` returns 0: help wins, and the output
+    registry lookup (patched here to raise) is never reached."""
+    def _registry_tripwire(_name):  # pragma: no cover
+        raise RuntimeError("registry must not run during help")
+    monkeypatch.setattr(cfg, "SEARCH_PATHS", [])
+    monkeypatch.setattr("loghunter.cli.get_handler", _registry_tripwire)
+    exit_code = cli._main(["beacon", "--help", "--output=bogus"])
+    assert exit_code == 0
+# ── --help=anything / -h=anything are NOT help ───────────────────────────────
+def test_help_with_value_raises_takes_no_value(
+    capsys: pytest.CaptureFixture[str],
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    """``--help=foo`` is not treated as help: ``cli.main`` exits and stderr
+    carries the strict parser's "takes no value" message."""
+    monkeypatch.setattr(cfg, "SEARCH_PATHS", [])
+    with pytest.raises(SystemExit):
+        cli.main(["--help=foo"])
+    stderr = capsys.readouterr().err
+    assert "--help (-h) takes no value" in stderr
+def test_short_help_with_value_raises_takes_no_value(
+    capsys: pytest.CaptureFixture[str],
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    """``-h=foo`` is not treated as help either: ``cli.main`` exits and
+    stderr carries the same "takes no value" message as the long form."""
+    monkeypatch.setattr(cfg, "SEARCH_PATHS", [])
+    with pytest.raises(SystemExit):
+        cli.main(["-h=foo"])
+    stderr = capsys.readouterr().err
+    assert "--help (-h) takes no value" in stderr
+# ── loghunter conn.log (bare filename in CWD) ────────────────────────────────
+def test_bare_filename_in_cwd_routes_as_analyze_path(
+    monkeypatch: pytest.MonkeyPatch,
+    tmp_path: Path,
+) -> None:
+    """A bare token naming a file in the CWD is handed to the runner as the
+    analyze target instead of being rejected as an unknown command, even
+    though it has none of the path-shape prefixes."""
+    monkeypatch.setattr(cfg, "SEARCH_PATHS", [])
+    monkeypatch.chdir(tmp_path)
+    runner_kwargs: dict[str, object] = {}
+    def fake_run(**kwargs: object) -> None:
+        runner_kwargs.update(kwargs)
+    monkeypatch.setattr("loghunter.runner.run", fake_run)
+    target = tmp_path / "conn.log"
+    target.write_text("", encoding="utf-8")
+    cli._main(["conn.log"])
+    # CLI now passes raw strings; the resolver owns Path conversion.
+    assert runner_kwargs.get("zeek_dir") == "conn.log"
+# ── --output=FORMAT validation via the registry ──────────────────────────────
+def test_unknown_output_format_raises_with_available_list(
+    monkeypatch: pytest.MonkeyPatch,
+    capsys: pytest.CaptureFixture[str],
+    tmp_path: Path,
+) -> None:
+    """``--output=bogus`` exits 1 with a CLI-formatted error that names the
+    bad format and lists the available ones; the built-in handlers must all
+    show up in that message."""
+    monkeypatch.setattr(cfg, "SEARCH_PATHS", [])
+    zeek_dir = tmp_path / "zeek"
+    zeek_dir.mkdir()
+    (zeek_dir / "conn.log").write_text("", encoding="utf-8")
+    argv = [f"--zeek-dir={zeek_dir}", "--output=bogus"]
+    with pytest.raises(SystemExit) as exc:
+        cli.main(argv)
+    assert exc.value.code == 1
+    stderr = capsys.readouterr().err
+    assert "Unknown output format 'bogus'." in stderr
+    assert "Available formats:" in stderr
+    # Built-in handlers must surface
+    builtin_formats = ("text", "json", "csv", "html")
+    missing = [fmt for fmt in builtin_formats if fmt not in stderr]
+    assert not missing
+def test_digest_unknown_output_format_uses_same_registry_error(
+    monkeypatch: pytest.MonkeyPatch,
+    capsys: pytest.CaptureFixture[str],
+    tmp_path: Path,
+) -> None:
+    """Digest reports an unknown ``--output`` in the same voice as analyze.
+    The registry check runs BEFORE digest's text-only rail, so
+    ``--output=bogus`` yields 'Unknown output format', not 'currently
+    supports only text'."""
+    monkeypatch.setattr(cfg, "SEARCH_PATHS", [])
+    digest_target = tmp_path / "x.log"
+    digest_target.write_text("", encoding="utf-8")
+    argv = ["digest", str(digest_target), "--output=bogus"]
+    with pytest.raises(SystemExit) as exc:
+        cli.main(argv)
+    assert exc.value.code == 1
+    stderr = capsys.readouterr().err
+    assert "Unknown output format 'bogus'." in stderr
+# ── export positionals come from the parser ──────────────────────────────────
+def test_export_positionals_come_from_parser(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    """``loghunter export splunk q1 q2`` forwards the backend and query names
+    to ``run_export`` from the parser's ``paths`` list, not by re-scraping
+    raw args."""
+    export_kwargs: dict[str, object] = {}
+    def fake_run_export(**kwargs: object) -> None:
+        export_kwargs.update(kwargs)
+    def fake_load(_: object = None) -> dict[str, object]:
+        # A fresh dict on every call, like a real config load.
+        return {
+            "export": {"splunk": {"host": "192.0.2.20", "port": 8089,
+                                  "query": {"q1": {"spl": "x"}, "q2": {"spl": "y"}}}},
+        }
+    monkeypatch.setattr("loghunter.exporters.run_export", fake_run_export)
+    monkeypatch.setattr(cfg, "load", fake_load)
+    cli.main(["export", "splunk", "q1", "q2"])
+    assert export_kwargs["backend"] == "splunk"
+    assert export_kwargs["query_names"] == ["q1", "q2"]
+# ── digest combination guard (preserved) ─────────────────────────────────────
+def test_digest_path_plus_zeek_dir_still_rejected(
+    monkeypatch: pytest.MonkeyPatch,
+    tmp_path: Path,
+) -> None:
+    """``digest PATH --zeek-dir=…`` raises ValueError, because a positional
+    self-routes via sniff. Bare digest with --zeek-dir stays allowed — that
+    is the bare-conn config-driven path."""
+    def fake_load(_: object = None) -> dict[str, object]:
+        return {"loghunter": {}}
+    monkeypatch.setattr(cfg, "load", fake_load)
+    digest_target = tmp_path / "x.log"
+    digest_target.write_text("", encoding="utf-8")
+    argv = ["digest", str(digest_target), "--zeek-dir=/x"]
+    with pytest.raises(ValueError, match="--zeek-dir is not valid alongside"):
+        cli._main(argv)
+# ── bare short-form value flag mentions both spellings ───────────────────────
+def test_bare_short_value_flag_short_lead_message(
+    capsys: pytest.CaptureFixture[str],
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    """A value flag given bare in its short form (``-o``) exits 1 with an
+    actionable message that shows both ``-o=…`` and ``--out=…``."""
+    monkeypatch.setattr(cfg, "SEARCH_PATHS", [])
+    with pytest.raises(SystemExit) as exc:
+        cli.main(["-o"])
+    assert exc.value.code == 1
+    stderr = capsys.readouterr().err
+    expected = "loghunter: --out (-o) needs a value: -o=… or --out=…"
+    assert expected in stderr
+# ── --detect/-d on single-detector verbs raises wrong-verb ───────────────────
+def test_detect_on_single_detector_verb_raises_wrong_verb(
+    capsys: pytest.CaptureFixture[str],
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    """``beacon --detect=all`` exits 1 with the wrong-verb message, led by
+    the long spelling the user typed."""
+    monkeypatch.setattr(cfg, "SEARCH_PATHS", [])
+    with pytest.raises(SystemExit) as exc:
+        cli.main(["beacon", "--detect=all"])
+    assert exc.value.code == 1
+    stderr = capsys.readouterr().err
+    assert "--detect (-d) is not valid for beacon" in stderr
+def test_short_detect_on_single_detector_verb_raises_wrong_verb(
+    capsys: pytest.CaptureFixture[str],
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    """``beacon -d=all`` exits 1 with the wrong-verb message, led by the
+    short spelling the user typed."""
+    monkeypatch.setattr(cfg, "SEARCH_PATHS", [])
+    with pytest.raises(SystemExit) as exc:
+        cli.main(["beacon", "-d=all"])
+    assert exc.value.code == 1
+    stderr = capsys.readouterr().err
+    assert "-d (--detect) is not valid for beacon" in stderr