npm - @inceptionstack/pi-hard-no - Versions diffs - 1.0.0 - Mend

@inceptionstack/pi-hard-no 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (23) hide show

package/default-review-rules.md ADDED Viewed

@@ -0,0 +1,150 @@
+## Correctness & Bugs
+- **Off-by-one errors**: wrong loop bounds (< vs <=, 0-indexed vs 1-indexed), fence-post errors in slicing/substring, incorrect range endpoints
+- **Null / undefined / nil access**: dereferencing values that can be absent, missing nil checks before member access, optional chaining gaps
+- **Type mismatches**: wrong argument types, implicit coercions that change behavior (string ↔ number, truthy/falsy surprises), incorrect casts
+- **Logic errors**: inverted conditions, wrong boolean operator (AND vs OR), negation errors, swapped arguments, wrong variable used in expression
+- **Boundary conditions**: empty collections, zero-length strings, negative numbers, integer overflow/underflow, maximum-size inputs
+- **Error handling**: missing error checks on fallible operations, swallowed exceptions, catch blocks that hide root causes, error paths that leave state inconsistent
+- **Resource leaks**: opened files/connections/handles never closed, missing cleanup in error paths, missing try-finally or equivalent
+- **Concurrency**: race conditions on shared mutable state, missing synchronization, non-atomic check-then-act patterns, deadlock potential
+- **Async correctness**: missing await on async calls, unhandled promise rejections, callbacks that can fire multiple times, event listener leaks
+- **Data flow**: variables written but never read, stale values used after mutation elsewhere, aliasing bugs where two references unexpectedly share state
+- **API contract violations**: passing values outside documented valid range, ignoring return values that signal errors, misusing library APIs
+- **Partial failure**: operations that can half-complete (write 3 of 5 records), leaving data in an inconsistent state — flag missing transactions or rollback logic
+- Each flagged bug must be **discrete and actionable** — identify the specific location, the trigger condition, and the concrete consequence
+- Do not speculate about what might break in other parts of the codebase without evidence — prove the issue from the code under review
+- Match the level of rigor to the codebase: do not demand production-grade defensive coding in one-off scripts or prototypes
+## Clean Architecture
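+- Enforce the dependency rule: source-code dependencies point inward (UI → Application → Domain); Infrastructure sits on the outside and plugs in by implementing ports defined by the inner layers (dependency inversion)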
+- Business logic must not depend on frameworks, databases, or external services directly
+- Use cases / application services must orchestrate domain objects, not contain domain logic themselves
+- Domain entities and value objects must be pure — no I/O, no framework imports
+- Adapters (controllers, repositories, gateways) must implement ports defined by inner layers
+- Flag any layer-skipping: UI calling infrastructure directly, domain importing from UI, etc.
+- Configuration and wiring belong at the composition root, not scattered across layers
+## SOLID Principles
+- **Single Responsibility**: each module/class/function should have one reason to change — flag god-classes and functions doing unrelated things
+- **Open/Closed**: prefer extension over modification — flag changes that require editing existing working code when a plugin/strategy/decorator pattern would suffice
+- **Liskov Substitution**: subtypes must be substitutable for their base types — flag overrides that narrow preconditions or weaken postconditions
+- **Interface Segregation**: clients should not depend on methods they don't use — flag fat interfaces that force implementors to stub unused methods
+- **Dependency Inversion**: high-level modules must not depend on low-level modules; both should depend on abstractions — flag direct instantiation of infrastructure in business logic
+## DRY — Don't Repeat Yourself
+- Flag duplicated logic across files (copy-paste code with minor variations)
+- Flag duplicated constants, magic numbers, and magic strings — extract to named constants
+- Flag repeated conditional patterns that should be polymorphism or lookup tables
+- Exception: test code may duplicate setup for readability — do not flag test helpers that are intentionally explicit
+## Clean Code
+- Functions should do one thing, do it well, and do it only
+- Functions should be short and operate at a single level of abstraction
+- Flag deep nesting (more than 2-3 levels) — suggest early returns or extraction
+- Flag functions with more than 3 parameters — suggest parameter objects
+- Flag boolean parameters that switch behavior — suggest separate functions
+- Names must reveal intent — flag cryptic abbreviations, single-letter variables (except conventional loop counters), and misleading names
+- Flag dead code: unreachable branches, unused variables, commented-out code
+- Flag side effects hidden in functions whose names suggest pure computation
+- Error handling must be explicit — flag swallowed exceptions, empty catch blocks, and generic error messages that hide root causes
+## Pragmatic Programmer
+- Flag violations of the principle of least surprise — code should behave as readers expect
+- Flag broken windows: sloppy code left alongside clean code signals that quality doesn't matter
+- Flag shotgun surgery: a single change requiring edits across many unrelated files
+- Flag feature envy: a function that uses more data from another module than from its own
+- Prefer composition over inheritance — flag deep inheritance hierarchies (more than 2 levels)
+- Flag primitive obsession: using raw strings/numbers/booleans where a value object or enum would add safety
+- Orthogonality: modules should be independent — changing one should not require changing others
+## Documentation & Release Notes
+- A changelog file should exist at the project root (`CHANGELOG.md`, `CHANGES.md`, `HISTORY.md`, or equivalent) documenting user-visible changes
+- When a change modifies user-visible behavior (new feature, bug fix, breaking change, deprecation, notable behavior change), flag if the changelog has not been updated to describe it
+- Changelog entries should be concrete and specific: what changed, why it matters to the user, not just the commit summary
+- Internal-only changes (refactors with no behavior change, test-only updates, documentation-only updates, build/tooling changes) do not require a changelog entry — do not flag these
+- If no changelog file exists at all and the project has user-visible changes accumulating, flag that one should be created (suggest Keep a Changelog format or similar)
+- Version bumps in `package.json` or equivalent without a matching changelog entry are a smell — flag the mismatch
+## Domain-Driven Design
+- Ubiquitous language: code names should match domain terminology — flag technical jargon where domain terms exist
+- Bounded contexts must have clear boundaries — flag domain concepts leaking across context boundaries
+- Aggregates must enforce their own invariants — flag external code that manipulates aggregate internals directly
+- Value objects must be immutable — flag mutable value objects
+- Domain events should be used for cross-aggregate side effects, not direct coupling
+- Repositories must only exist for aggregate roots, not for every entity
+- Flag anemic domain models: entities that are just data bags with getters/setters while logic lives in services
+## Security — OWASP Top 10 (Web / General)
+- **Broken Access Control**: missing authorization checks, IDOR (direct object references without ownership validation), privilege escalation paths, missing CORS configuration
+- **Cryptographic Failures**: hardcoded secrets, API keys, passwords, or tokens in code; weak hashing (MD5, SHA1 for passwords); missing encryption for sensitive data at rest or in transit
+- **Injection**: SQL injection via string concatenation, command injection via unsanitized shell arguments, XSS via unescaped user input in HTML/templates, LDAP/XML/path injection
+- **Insecure Design**: missing rate limiting on sensitive endpoints, no account lockout, missing input validation at trust boundaries, business logic flaws
+- **Security Misconfiguration**: verbose error messages exposing internals, default credentials, unnecessary features enabled, missing security headers
+- **Vulnerable Components**: known-vulnerable dependency versions, unmaintained libraries, dependencies with known CVEs
+- **Authentication Failures**: weak password policies, missing MFA where appropriate, session tokens in URLs, missing session invalidation on logout/password change
+- **Data Integrity Failures**: missing integrity checks on critical data, unsigned/unverified updates, deserialization of untrusted data without validation
+- **Logging & Monitoring Failures**: missing audit logs for security-relevant actions, logging sensitive data (passwords, tokens, PII), insufficient error logging for incident response
+- **SSRF**: server-side requests using user-supplied URLs without allowlist validation, internal service URLs exposed
+## Security — OWASP Top 10 for LLM / AI Applications
+- **Prompt Injection**: user input concatenated directly into LLM prompts without sanitization, missing input/output boundaries, indirect injection via retrieved documents or tool outputs
+- **Sensitive Information Disclosure**: PII, credentials, or proprietary data included in prompts, model responses, or training data; missing output filtering; conversation history leaking across users
+- **Supply Chain Vulnerabilities**: untrusted model sources, unverified model weights, poisoned training data pipelines, compromised fine-tuning datasets
+- **Data and Model Poisoning**: training or fine-tuning on unvalidated user-generated content, no data provenance tracking, missing anomaly detection on training inputs
+- **Improper Output Handling**: LLM output used directly in SQL queries, shell commands, code execution, or HTML rendering without sanitization — treat all model output as untrusted
+- **Excessive Agency**: LLM given write/execute/delete capabilities without human-in-the-loop confirmation, missing scope restrictions on tool access, no action audit trail
+- **System Prompt Leakage**: system prompts retrievable via adversarial queries, sensitive instructions or architecture details in prompts, no prompt confidentiality controls
+- **Vector and Embedding Weaknesses**: RAG retrieval without access control (users retrieving documents they shouldn't see), embedding injection, poisoned vector store entries
+- **Misinformation**: no fact-checking or grounding for critical outputs, model hallucinations presented as authoritative, missing disclaimers on generated content
+- **Unbounded Consumption**: missing token/cost limits per request or user, recursive agent loops without caps, no rate limiting on AI endpoints
+## AI Trifecta — Critical AI Security Intersection
+- **Prompt Injection + Data Poisoning + Tool Use**: the most dangerous combination — poisoned retrieval data triggers prompt injection that invokes privileged tools; flag any path where untrusted data flows into prompts that have access to sensitive tools
+- Flag chains where: retrieval → prompt → tool execution has no trust boundary validation at each step
+- Flag missing sandboxing for AI-invoked code execution or file system access
+- Flag AI systems that can modify their own instructions, training data, or retrieval sources
+## Unit Testing — Osherove's Art of Unit Testing
+### Naming
+- Test names must describe: unit of work, scenario/input, and expected result
+- Pattern: `[UnitOfWork]_[Scenario]_[ExpectedBehavior]` or equivalent readable form
+- Flag cryptic test names like `test1`, `testIt`, `shouldWork`, or names that don't describe the scenario
+- Test names should read as specifications — a non-developer should understand what is being tested
+### Trustworthiness
+- Each test must have exactly one logical assertion (one reason to fail) — flag tests with multiple unrelated assertions
+- No logic in tests: no if/else, loops, switch, or try/catch in test code — these make tests unreliable
+- Flag tests that test implementation details (private methods, internal state) instead of observable behavior
+- Flag tests without assertions (passing tests that verify nothing)
+- Flag flaky patterns: time-dependent tests, order-dependent tests, tests sharing mutable state
+- Tests must fail for the right reason — flag assertions that would pass even if the code were broken
+### Readability
+- Tests should follow Arrange-Act-Assert (or Given-When-Then) structure clearly
+- Flag excessive setup that obscures what is being tested — prefer factory methods or builders
+- Flag shared mutable test fixtures — prefer fresh setup per test
+- Magic values must be explained or extracted to named constants
+- The entire test should be readable without scrolling — if it's long, it's testing too much
+### Maintainability
+- Flag over-mocking: tests that mock everything except the unit under test lose integration confidence
+- Flag brittle tests: tests that break when implementation changes but behavior doesn't
+- Flag test duplication: identical test logic copy-pasted across files — extract shared test utilities
+- Test helpers and custom matchers are encouraged when they improve clarity
+- Flag missing edge case tests for: null/empty inputs, boundary values, error paths, concurrent access

package/git-roots.ts ADDED Viewed

@@ -0,0 +1,94 @@
+/**
+ * git-roots.ts — Detect git repo roots from modified file paths
+ * Expands ~ to homedir for correct path resolution.
+ * Caches resolved roots to avoid repeated git calls.
+ */
+import { dirname, resolve, isAbsolute } from "node:path";
+import { homedir } from "node:os";
+import type { ExtensionAPI } from "@mariozechner/pi-coding-agent";
+/**
+ * Find the git repo root for a given directory by running
+ * `git -C <dir> rev-parse --show-toplevel` through `pi.exec`.
+ *
+ * @param pi - Extension API; only its `exec` method is used here.
+ * @param dir - Directory handed to `git -C`.
+ * @returns The trimmed stdout of the git command when it exits with code 0
+ *   and prints a non-blank line; otherwise null. Errors thrown by `pi.exec`
+ *   are swallowed and also yield null, so callers cannot distinguish
+ *   "not in a git repo" from any other failure of the call.
+ */
+export async function findGitRoot(pi: ExtensionAPI, dir: string): Promise<string | null> {
+  try {
+    const result = await pi.exec("git", ["-C", dir, "rev-parse", "--show-toplevel"], {
+      timeout: 5000, // presumably milliseconds — confirm against pi.exec's options
+    });
+    if (result.code === 0 && result.stdout.trim()) {
+      return result.stdout.trim();
+    }
+  } catch {
+    /* any failure of the exec call is treated as "not in a git repo" */
+  }
+  return null;
+}
+/**
+ * Given a set of modified file paths and pi's cwd, find all unique
+ * git repo roots that contain the modified files.
+ *
+ * Each path is made absolute (a leading "~/" is expanded to the home
+ * directory, relative paths are resolved against `cwd`) and the git root is
+ * looked up for its parent directory. Lookups are cached per directory for
+ * the duration of this call, so files sharing a directory trigger one git
+ * invocation. Lookups run sequentially, one awaited call at a time.
+ *
+ * @param pi - Extension API forwarded to `findGitRoot`.
+ * @param cwd - Base directory for relative paths; also the fallback lookup.
+ * @param modifiedFiles - Paths to classify. Entries equal to
+ *   "(bash file op)" are skipped.
+ * @returns A map of gitRoot → list of files in that repo. Files are stored
+ *   exactly as they were passed in (not expanded or made absolute). Files
+ *   not in any git repo are grouped under the key "(no-git)". When no file
+ *   was processed at all, the map holds the root of `cwd` with an empty
+ *   list, or is empty if `cwd` is not in a repo.
+ *
+ * NOTE(review): only the "~/" prefix is expanded; a bare "~" or "~user/..."
+ * is treated as a relative path.
+ */
+export async function resolveGitRoots(
+  pi: ExtensionAPI,
+  cwd: string,
+  modifiedFiles: Set<string>,
+): Promise<Map<string, string[]>> {
+  const roots = new Map<string, string[]>();
+  const resolvedCache = new Map<string, string | null>(); // dir → gitRoot cache (null = looked up, not in a repo)
+  for (const file of modifiedFiles) {
+    if (file === "(bash file op)") continue; // presumably a placeholder entry rather than a real path — confirm with the producer
+    // Expand ~ to homedir
+    const expanded = file.startsWith("~/") ? resolve(homedir(), file.slice(2)) : file;
+    const absPath = isAbsolute(expanded) ? expanded : resolve(cwd, expanded);
+    const dir = dirname(absPath);
+    // Check cache first; undefined means "never looked up", null is a cached miss
+    let gitRoot: string | null | undefined = resolvedCache.get(dir);
+    if (gitRoot === undefined) {
+      gitRoot = await findGitRoot(pi, dir);
+      resolvedCache.set(dir, gitRoot);
+    }
+    const key = gitRoot ?? "(no-git)";
+    const list = roots.get(key) ?? [];
+    list.push(file);
+    roots.set(key, list);
+  }
+  // Fall back to cwd only when no file was processed at all; a "(no-git)" entry keeps roots non-empty and skips this
+  if (roots.size === 0) {
+    const cwdRoot = await findGitRoot(pi, cwd);
+    if (cwdRoot) {
+      roots.set(cwdRoot, []);
+    }
+  }
+  return roots;
+}
+/**
+ * Resolve all git roots from multiple sources:
+ * tracked modified files, tool call paths, and detected bash git roots.
+ *
+ * @param pi - Extension API forwarded to `resolveGitRoots`.
+ * @param cwd - Base directory for resolving relative paths.
+ * @param modifiedFiles - Tracked modified file paths.
+ * @param toolCallPaths - Additional paths; merged with `modifiedFiles` into
+ *   one de-duplicated set before resolution.
+ * @param detectedGitRoots - Roots already known; copied into the result
+ *   as-is (the input set itself is not mutated).
+ * @returns A new set holding `detectedGitRoots` plus every root found for
+ *   the combined files. The "(no-git)" bucket is excluded.
+ */
+export async function resolveAllGitRoots(
+  pi: ExtensionAPI,
+  cwd: string,
+  modifiedFiles: Set<string>,
+  toolCallPaths: string[],
+  detectedGitRoots: Set<string>,
+): Promise<Set<string>> {
+  const allRoots = new Set(detectedGitRoots);
+  const combinedFiles = new Set([...modifiedFiles, ...toolCallPaths]);
+  const fileRoots = await resolveGitRoots(pi, cwd, combinedFiles);
+  for (const root of fileRoots.keys()) {
+    if (root !== "(no-git)") allRoots.add(root);
+  }
+  return allRoots;
+}

package/helpers.ts ADDED Viewed

@@ -0,0 +1,72 @@
+/**
+ * helpers.ts — Extracted pure functions for testability
+ */
+import { randomBytes } from "node:crypto";
+/**
+ * Generate a short unique ID for a review cycle.
+ * Format: `r-` + 8 lowercase hex chars (32 bits, ~4B possible values).
+ * Enough uniqueness for debugging/correlation within a session; with only
+ * 32 bits it is not meant to be used as a security token.
+ *
+ * @returns A 10-character string such as `r-1a2b3c4d`.
+ */
+export function createReviewId(): string {
+  return `r-${randomBytes(4).toString("hex")}`;
+}
+/**
+ * Clamp requested commit count to available commits.
+ * Returns the effective count and whether it was clamped.
+ *
+ * @param requested - Number of commits the caller asked for.
+ * @param totalCommits - Number of commits actually available.
+ * @returns `effectiveCount` is `min(requested, totalCommits)`; `wasClamped`
+ *   is true when that is smaller than `requested`. When `totalCommits` is
+ *   zero or negative the result is always `{ effectiveCount: 0,
+ *   wasClamped: true }`, even if `requested` is 0.
+ *
+ * NOTE(review): there is no lower bound — a negative `requested` is
+ * returned unchanged as `effectiveCount` when `totalCommits` is positive.
+ */
+export function clampCommitCount(
+  requested: number,
+  totalCommits: number,
+): { effectiveCount: number; wasClamped: boolean } {
+  if (totalCommits <= 0) {
+    return { effectiveCount: 0, wasClamped: true };
+  }
+  const effectiveCount = Math.min(requested, totalCommits);
+  return {
+    effectiveCount,
+    wasClamped: effectiveCount < requested,
+  };
+}
+/**
+ * Determine whether to diff against empty tree (all commits)
+ * or HEAD~N (partial history).
+ *
+ * @param effectiveCount - Number of commits that will be reviewed.
+ * @param totalCommits - Number of commits available.
+ * @returns true when `effectiveCount` covers every available commit
+ *   (`effectiveCount >= totalCommits`), false otherwise.
+ */
+export function shouldDiffAllCommits(effectiveCount: number, totalCommits: number): boolean {
+  return effectiveCount >= totalCommits;
+}
+/**
+ * Truncate a diff string to maxLen, appending a note if truncated.
+ *
+ * @param diff - Diff text to limit.
+ * @param maxLen - Maximum number of characters of `diff` to keep, counted
+ *   in UTF-16 code units (`String.prototype.length`).
+ * @returns `diff` unchanged when it already fits; otherwise its first
+ *   `maxLen` code units followed by a note stating how many were omitted.
+ *   The returned string is therefore longer than `maxLen`.
+ *
+ * NOTE(review): the cut is not aware of surrogate pairs or line boundaries.
+ * A negative `maxLen` makes `slice` count from the end of the string, so
+ * the kept text and the reported `omitted` count no longer agree.
+ */
+export function truncateDiff(diff: string, maxLen: number): string {
+  if (diff.length <= maxLen) return diff;
+  const omitted = diff.length - maxLen;
+  return diff.slice(0, maxLen) + `\n\n... (diff truncated, ${omitted} chars omitted)`;
+}
+/**
+ * Per-file budget (ms) for scaling the review timeout with file count:
+ * 120_000 ms, i.e. two minutes per file.
+ * The reviewer spends time reading + reasoning about each file, so a multi-file
+ * review deserves proportionally more wall-clock budget.
+ */
+export const REVIEW_PER_FILE_BUDGET_MS = 120_000;
+/**
+ * Compute the effective wall-clock budget for a review run.
+ *
+ * Takes the larger of the user-configured minimum (`settings.reviewTimeoutMs`)
+ * and a per-file scaling factor (`fileCount * REVIEW_PER_FILE_BUDGET_MS`), so
+ * small reviews respect the user's floor and large reviews get enough headroom.
+ *
+ * Centralized here so changing the per-file factor or clamping logic happens
+ * in one place — previously this formula was duplicated in orchestrator.ts
+ * and commands.ts.
+ *
+ * @param minTimeoutMs - Floor for the result, in milliseconds.
+ * @param fileCount - Number of files under review; negative values are
+ *   treated as 0.
+ * @returns `max(minTimeoutMs, max(0, fileCount) * REVIEW_PER_FILE_BUDGET_MS)`.
+ *   There is no upper cap.
+ */
+export function computeReviewTimeoutMs(minTimeoutMs: number, fileCount: number): number {
+  const scaled = Math.max(0, fileCount) * REVIEW_PER_FILE_BUDGET_MS;
+  return Math.max(minTimeoutMs, scaled);
+}

package/ignore.ts ADDED Viewed

@@ -0,0 +1,105 @@
+/**
+ * ignore.ts — .hardno/ignore pattern matching
+ *
+ * Uses gitignore-style patterns:
+ *   - Blank lines and lines starting with # are ignored
+ *   - * matches anything except /
+ *   - ** matches everything including /
+ *   - ? matches a single character
+ *   - Patterns without / match the filename only
+ *   - Patterns with / match the full path
+ *   - Leading ! negates a pattern
+ *   - Trailing / means directory (treated as dir/**)
+ */
+import { basename } from "node:path";
+import { log } from "./logger";
+import { readConfigFile } from "./settings";
+/**
+ * Load the "ignore" config file via `readConfigFile(cwd, "ignore")` and
+ * parse it into a list of patterns.
+ * The lookup is described as trying cwd/.hardno/ first, then ~/.pi/.hardno/;
+ * that order is implemented in `readConfigFile`, not in this function.
+ *
+ * @param cwd - Working directory handed to `readConfigFile`.
+ * @returns The parsed patterns, or null when `readConfigFile` returns null
+ *   or when reading/parsing throws. In the latter case a warning is logged
+ *   and the error is not rethrown.
+ */
+export async function loadIgnorePatterns(cwd: string): Promise<string[] | null> {
+  try {
+    const content = await readConfigFile(cwd, "ignore");
+    if (content === null) return null;
+    return parseIgnoreFile(content);
+  } catch (err: any) {
+    log(`Warning: could not read .hardno/ignore: ${err?.message}`); // best-effort: ignore rules are optional, so fall through to null
+    return null;
+  }
+}
+/**
+ * Parse ignore file content into pattern strings.
+ *
+ * Splits on "\n", trims surrounding whitespace from every line (which also
+ * removes the "\r" left over from CRLF line endings), then drops empty
+ * lines and lines whose first non-blank character is "#".
+ *
+ * @param content - Raw text of the ignore file.
+ * @returns The remaining lines in file order. A leading "!" is kept as part
+ *   of the pattern string.
+ */
+export function parseIgnoreFile(content: string): string[] {
+  return content
+    .split("\n")
+    .map((line) => line.trim())
+    .filter((line) => line.length > 0 && !line.startsWith("#"));
+}
+/**
+ * Convert a gitignore-style pattern to a RegExp.
+ * The pattern should NOT have a ! prefix (negation is handled by the caller).
+ *
+ * Translation rules, as implemented below:
+ *   - a trailing "/" is rewritten to "/**" before anything else
+ *   - regex metacharacters other than "*" and "?" are escaped
+ *   - "**" becomes ".*", "*" becomes "[^/]*", "?" becomes "[^/]"
+ *   - a pattern containing "/" is anchored to the whole path ("^...$"),
+ *     with one leading "/" removed first
+ *   - a pattern without "/" is matched against the last path segment
+ *     ("(^|/)...$")
+ *
+ * @param pattern - Pattern text without a negation prefix.
+ * @returns A RegExp with no flags implementing the rules above.
+ *
+ * NOTE(review): "**" is protected from the single-"*" rewrite by swapping
+ * it for the literal text "DOUBLESTAR", so a pattern that itself contains
+ * "DOUBLESTAR" is turned into ".*" as well.
+ * NOTE(review): a leading "**" followed by "/" compiles to ".*" plus "/",
+ * which requires at least one "/" before the rest; unlike gitignore it
+ * does not match an entry at the top level.
+ */
+function patternToRegex(pattern: string): RegExp {
+  // Handle trailing / as directory pattern → dir/**
+  let p = pattern;
+  if (p.endsWith("/")) {
+    p = p.slice(0, -1) + "/**";
+  }
+  const matchFullPath = p.includes("/"); // decided after the trailing-slash rewrite, so directory patterns always take the full-path branch
+  let regex = p
+    .replace(/([.+^${}()|[\]\\])/g, "\\$1") // escape regex metacharacters, leaving * and ? for the glob rewrites
+    .replace(/\*\*/g, "DOUBLESTAR") // park ** so the next step only sees single *
+    .replace(/\*/g, "[^/]*")
+    .replace(/\?/g, "[^/]")
+    .replace(/DOUBLESTAR/g, ".*");
+  if (matchFullPath) {
+    if (regex.startsWith("/")) regex = regex.slice(1); // paths are tested without a leading "/", so drop the root anchor
+    regex = `^${regex}$`;
+  } else {
+    regex = `(^|/)${regex}$`;
+  }
+  return new RegExp(regex);
+}
+/**
+ * Check if a file path should be ignored based on patterns.
+ * Follows gitignore semantics: last matching pattern wins, ! negates.
+ *
+ * Every pattern is tested against the path (with one leading "./" removed)
+ * and, for patterns without "/", additionally against the basename.
+ *
+ * @param filePath - Path to test.
+ * @param patterns - Patterns in file order; a leading "!" marks a negation.
+ * @returns true when the last matching pattern is a plain pattern, false
+ *   when it is a negation or when nothing matches.
+ *
+ * NOTE(review): only a leading "./" is normalized. Absolute paths and
+ * backslash separators are passed to the regex unchanged — confirm that
+ * callers supply repo-relative, "/"-separated paths.
+ * NOTE(review): a RegExp is rebuilt for every pattern on every call.
+ */
+export function shouldIgnore(filePath: string, patterns: string[]): boolean {
+  const name = basename(filePath);
+  const normalized = filePath.startsWith("./") ? filePath.slice(2) : filePath;
+  let ignored = false;
+  for (const pattern of patterns) {
+    const isNegated = pattern.startsWith("!");
+    const raw = isNegated ? pattern.slice(1) : pattern;
+    const regex = patternToRegex(raw);
+    const matchesPath = regex.test(normalized);
+    const matchesName = !raw.includes("/") && regex.test(name);
+    if (matchesPath || matchesName) {
+      ignored = !isNegated; // later matches overwrite earlier ones
+    }
+  }
+  return ignored;
+}
+/**
+ * Filter a list of file paths, removing ignored ones.
+ *
+ * @param files - Candidate file paths.
+ * @param patterns - Ignore patterns, evaluated per file by `shouldIgnore`.
+ * @returns A new array with the paths that are not ignored, in their
+ *   original order; `files` is not modified.
+ */
+export function filterIgnored(files: string[], patterns: string[]): string[] {
+  return files.filter((f) => !shouldIgnore(f, patterns));
+}