npm - @oss-scout/core - Versions diffs - 0.10.0 → 1.0.0 - Mend

@oss-scout/core 0.10.0 → 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (64)

package/dist/cli.bundle.cjs +77 -60
package/dist/cli.js +403 -416
package/dist/commands/command-scout.d.ts +21 -0
package/dist/commands/command-scout.js +21 -0
package/dist/commands/config.js +10 -128
package/dist/commands/features.js +15 -28
package/dist/commands/results.d.ts +13 -2
package/dist/commands/results.js +29 -2
package/dist/commands/search.d.ts +7 -0
package/dist/commands/search.js +63 -68
package/dist/commands/setup.d.ts +2 -0
package/dist/commands/setup.js +35 -6
package/dist/commands/skip.d.ts +4 -0
package/dist/commands/skip.js +45 -55
package/dist/commands/sync.d.ts +10 -0
package/dist/commands/sync.js +10 -0
package/dist/commands/vet-list.js +3 -19
package/dist/commands/vet.js +18 -25
package/dist/commands/with-scout.d.ts +32 -0
package/dist/commands/with-scout.js +41 -0
package/dist/core/anti-llm-policy.js +4 -5
package/dist/core/bootstrap.d.ts +2 -2
package/dist/core/bootstrap.js +5 -9
package/dist/core/errors.d.ts +10 -0
package/dist/core/errors.js +20 -5
package/dist/core/feature-discovery.d.ts +13 -1
package/dist/core/feature-discovery.js +104 -81
package/dist/core/gist-state-store.d.ts +13 -12
package/dist/core/gist-state-store.js +128 -53
package/dist/core/http-cache.d.ts +32 -2
package/dist/core/http-cache.js +74 -19
package/dist/core/issue-discovery.d.ts +3 -0
package/dist/core/issue-discovery.js +51 -31
package/dist/core/issue-eligibility.d.ts +10 -4
package/dist/core/issue-eligibility.js +119 -67
package/dist/core/issue-graphql.d.ts +58 -0
package/dist/core/issue-graphql.js +108 -0
package/dist/core/issue-vetting.d.ts +105 -8
package/dist/core/issue-vetting.js +234 -107
package/dist/core/local-state.d.ts +6 -2
package/dist/core/local-state.js +23 -5
package/dist/core/logger.d.ts +12 -4
package/dist/core/logger.js +33 -7
package/dist/core/personalization.d.ts +51 -18
package/dist/core/personalization.js +101 -27
package/dist/core/preference-fields.d.ts +47 -0
package/dist/core/preference-fields.js +178 -0
package/dist/core/repo-health.js +31 -15
package/dist/core/roadmap.js +17 -3
package/dist/core/schemas.d.ts +144 -26
package/dist/core/schemas.js +74 -17
package/dist/core/search-budget.d.ts +9 -0
package/dist/core/search-budget.js +36 -3
package/dist/core/search-phases.d.ts +0 -18
package/dist/core/search-phases.js +27 -82
package/dist/core/types.d.ts +146 -30
package/dist/core/utils.js +60 -26
package/dist/formatters/markdown.d.ts +10 -0
package/dist/formatters/markdown.js +31 -0
package/dist/index.d.ts +6 -2
package/dist/index.js +8 -0
package/dist/scout.d.ts +59 -10
package/dist/scout.js +244 -19
package/package.json +1 -1

package/dist/core/personalization.d.ts CHANGED Viewed

@@ -1,15 +1,18 @@
 /**
  * Personalization signals for search ranking (#1244).
  *
- * Translates caller-supplied `preferLanguages` / `preferRepos` lists
- * into a soft `boostScore` on each `IssueCandidate`. The final search
- * sort consults this score between the `recommendation` tier and the
- * raw `viabilityScore`, so personalization reorders ties without
- * changing which candidates pass vetting.
- *
- * This is the minimum-viable subset of Option A in #1244: only language
- * and repo bias, no `boostIssueTypes` / `avoidRepos` / `diversityRatio`
- * yet. Those follow up in separate PRs.
+ * Two passes:
+ *
+ *   - `annotateBoost` translates `preferLanguages` / `preferRepos`
+ *     into a soft `boostScore` consumed by issue-discovery's final
+ *     sort tier between `recommendation` and `viabilityScore`.
+ *   - `applyDiversityRatio` reserves a fraction of the final slot
+ *     budget for candidates that matched no preference, counterweighting
+ *     echo-chamber bias as recommendations accumulate over time.
+ *
+ * Still out of scope for #1244: `boostIssueTypes`, `avoidRepos`, and
+ * render-time annotation of `boostReasons` / `diversitySlot` in the CLI
+ * non-JSON output. Those follow up in separate PRs.
  */
 import type { IssueCandidate } from "./types.js";
 /**
@@ -25,15 +28,45 @@ import type { IssueCandidate } from "./types.js";
 export declare const REPO_BOOST = 20;
 export declare const LANGUAGE_BOOST = 10;
 /**
- * Annotate each candidate with `boostScore` and `boostReasons` based on
- * the caller-supplied preference lists. Mutates the array in place; the
- * caller is responsible for re-sorting afterwards.
+ * The personalization sort weight of a candidate: its boost score, or 0 when it
+ * is not boosted (unboosted or a diversity slot). Reads the structural
+ * `personalization` field (#158) so callers never poke at the old loose
+ * `boostScore` field.
+ */
+export declare function boostScoreOf(candidate: IssueCandidate): number;
+/**
+ * Return a new candidate list where each candidate that matches a
+ * caller-supplied preference carries `personalization: { kind: "boosted", ... }`.
+ * Does NOT mutate the input candidates (#158) — matched candidates are shallow
+ * copies with the field set; unmatched candidates are passed through unchanged.
+ * The caller re-sorts the returned array.
+ *
+ * No-op when both preference lists are empty or undefined: the input array is
+ * returned as-is and the sort tier collapses to 0 for every candidate.
+ */
+export declare function annotateBoost(candidates: IssueCandidate[], preferLanguages?: string[], preferRepos?: string[]): IssueCandidate[];
+/**
+ * Apply a diversity-counterweight pass over a pre-sorted candidate list
+ * (#1244). Returns the first `maxResults` picks in priority order:
+ *
+ *   1. Main slots: `maxResults - floor(maxResults * diversityRatio)`
+ *      top candidates from the input. Personalization-biased candidates
+ *      win these slots when present (since the input is already sorted
+ *      by the personalization tier).
+ *   2. Diversity slots: the highest-ranked remaining candidates that are
+ *      not boosted (`boostScoreOf` is 0) — i.e. they matched neither
+ *      `preferLanguages` nor `preferRepos`. Returned as shallow copies
+ *      tagged `personalization: { kind: "diversity" }` for transparency.
+ *   3. Top-up: if the diversity pool was thinner than the reserve, fall
+ *      back to the remaining sorted candidates so the user gets
+ *      `maxResults` slots whenever the source has enough material.
  *
- * Mutation (rather than returning new objects) keeps the personalization
- * step a single linear pass over the array the caller already holds —
- * the sort step reads back from the same objects.
+ * `diversityRatio` is clamped to [0, 1]. 0 is a no-op (just slices the
+ * input). 1 means every slot is a diversity slot — useful for
+ * deliberately suppressing personalization without disabling it.
  *
- * No-op when both preference lists are empty or undefined: candidates
- * retain `boostScore: undefined` and the sort tier collapses to 0.
+ * @param candidates    Pre-sorted candidate list (output of issue-discovery)
+ * @param maxResults    Total slots to fill
+ * @param diversityRatio Fraction of slots reserved for unboosted candidates
  */
-export declare function annotateBoost(candidates: IssueCandidate[], preferLanguages?: string[], preferRepos?: string[]): void;
+export declare function applyDiversityRatio(candidates: IssueCandidate[], maxResults: number, diversityRatio: number): IssueCandidate[];

package/dist/core/personalization.js CHANGED Viewed

@@ -1,15 +1,18 @@
 /**
  * Personalization signals for search ranking (#1244).
  *
- * Translates caller-supplied `preferLanguages` / `preferRepos` lists
- * into a soft `boostScore` on each `IssueCandidate`. The final search
- * sort consults this score between the `recommendation` tier and the
- * raw `viabilityScore`, so personalization reorders ties without
- * changing which candidates pass vetting.
- *
- * This is the minimum-viable subset of Option A in #1244: only language
- * and repo bias, no `boostIssueTypes` / `avoidRepos` / `diversityRatio`
- * yet. Those follow up in separate PRs.
+ * Two passes:
+ *
+ *   - `annotateBoost` translates `preferLanguages` / `preferRepos`
+ *     into a soft `boostScore` consumed by issue-discovery's final
+ *     sort tier between `recommendation` and `viabilityScore`.
+ *   - `applyDiversityRatio` reserves a fraction of the final slot
+ *     budget for candidates that matched no preference, counterweighting
+ *     echo-chamber bias as recommendations accumulate over time.
+ *
+ * Still out of scope for #1244: `boostIssueTypes`, `avoidRepos`, and
+ * render-time annotation of `boostReasons` / `diversitySlot` in the CLI
+ * non-JSON output. Those follow up in separate PRs.
  */
 /**
  * Boost weights. Tuned conservatively so personalization tips equally-
@@ -24,37 +27,108 @@
 export const REPO_BOOST = 20;
 export const LANGUAGE_BOOST = 10;
 /**
- * Annotate each candidate with `boostScore` and `boostReasons` based on
- * the caller-supplied preference lists. Mutates the array in place; the
- * caller is responsible for re-sorting afterwards.
- *
- * Mutation (rather than returning new objects) keeps the personalization
- * step a single linear pass over the array the caller already holds —
- * the sort step reads back from the same objects.
+ * The personalization sort weight of a candidate: its boost score, or 0 when it
+ * is not boosted (unboosted or a diversity slot). Reads the structural
+ * `personalization` field (#158) so callers never poke at the old loose
+ * `boostScore` field.
+ */
+export function boostScoreOf(candidate) {
+    return candidate.personalization?.kind === "boosted"
+        ? candidate.personalization.score
+        : 0;
+}
+/**
+ * Return a new candidate list where each candidate that matches a
+ * caller-supplied preference carries `personalization: { kind: "boosted", ... }`.
+ * Does NOT mutate the input candidates (#158) — matched candidates are shallow
+ * copies with the field set; unmatched candidates are passed through unchanged.
+ * The caller re-sorts the returned array.
  *
- * No-op when both preference lists are empty or undefined: candidates
- * retain `boostScore: undefined` and the sort tier collapses to 0.
+ * No-op when both preference lists are empty or undefined: the input array is
+ * returned as-is and the sort tier collapses to 0 for every candidate.
  */
 export function annotateBoost(candidates, preferLanguages, preferRepos) {
     const langSet = new Set((preferLanguages ?? []).map((l) => l.trim().toLowerCase()).filter(Boolean));
-    const repoSet = new Set((preferRepos ?? []).map((r) => r.trim()).filter(Boolean));
+    const repoSet = new Set((preferRepos ?? []).map((r) => r.trim().toLowerCase()).filter(Boolean));
     if (langSet.size === 0 && repoSet.size === 0)
-        return;
-    for (const c of candidates) {
+        return candidates;
+    return candidates.map((c) => {
         let score = 0;
         const reasons = [];
-        if (repoSet.size > 0 && repoSet.has(c.issue.repo)) {
+        if (repoSet.size > 0 && repoSet.has(c.issue.repo.toLowerCase())) {
             score += REPO_BOOST;
             reasons.push(`repo affinity: ${c.issue.repo}`);
         }
-        const lang = c.projectHealth.language;
+        const lang = c.projectHealth.checkFailed ? null : c.projectHealth.language;
         if (langSet.size > 0 && lang && langSet.has(lang.toLowerCase())) {
             score += LANGUAGE_BOOST;
             reasons.push(`language match: ${lang}`);
         }
-        if (score > 0) {
-            c.boostScore = score;
-            c.boostReasons = reasons;
-        }
+        if (score === 0)
+            return c;
+        return { ...c, personalization: { kind: "boosted", score, reasons } };
+    });
+}
+/**
+ * Apply a diversity-counterweight pass over a pre-sorted candidate list
+ * (#1244). Returns the first `maxResults` picks in priority order:
+ *
+ *   1. Main slots: `maxResults - floor(maxResults * diversityRatio)`
+ *      top candidates from the input. Personalization-biased candidates
+ *      win these slots when present (since the input is already sorted
+ *      by the personalization tier).
+ *   2. Diversity slots: the highest-ranked remaining candidates that are
+ *      not boosted (`boostScoreOf` is 0) — i.e. they matched neither
+ *      `preferLanguages` nor `preferRepos`. Returned as shallow copies
+ *      tagged `personalization: { kind: "diversity" }` for transparency.
+ *   3. Top-up: if the diversity pool was thinner than the reserve, fall
+ *      back to the remaining sorted candidates so the user gets
+ *      `maxResults` slots whenever the source has enough material.
+ *
+ * `diversityRatio` is clamped to [0, 1]. 0 is a no-op (just slices the
+ * input). 1 means every slot is a diversity slot — useful for
+ * deliberately suppressing personalization without disabling it.
+ *
+ * @param candidates    Pre-sorted candidate list (output of issue-discovery)
+ * @param maxResults    Total slots to fill
+ * @param diversityRatio Fraction of slots reserved for unboosted candidates
+ */
+export function applyDiversityRatio(candidates, maxResults, diversityRatio) {
+    if (maxResults <= 0)
+        return [];
+    const ratio = Math.max(0, Math.min(1, diversityRatio));
+    if (ratio === 0)
+        return candidates.slice(0, maxResults);
+    const diversityReserve = Math.min(Math.floor(maxResults * ratio), maxResults);
+    if (diversityReserve === 0)
+        return candidates.slice(0, maxResults);
+    const mainBudget = maxResults - diversityReserve;
+    const picks = [];
+    const seen = new Set();
+    for (const c of candidates) {
+        if (picks.length >= mainBudget)
+            break;
+        picks.push(c);
+        seen.add(c.issue.url);
+    }
+    for (const c of candidates) {
+        if (picks.length >= maxResults)
+            break;
+        if (seen.has(c.issue.url))
+            continue;
+        if (boostScoreOf(c) > 0)
+            continue;
+        // Tag a shallow copy rather than mutating the shared candidate (#158).
+        picks.push({ ...c, personalization: { kind: "diversity" } });
+        seen.add(c.issue.url);
+    }
+    for (const c of candidates) {
+        if (picks.length >= maxResults)
+            break;
+        if (seen.has(c.issue.url))
+            continue;
+        picks.push(c);
+        seen.add(c.issue.url);
     }
+    return picks;
 }

package/dist/core/preference-fields.d.ts ADDED Viewed

@@ -0,0 +1,47 @@
+/**
+ * Shared preference-field metadata and value parsing.
+ *
+ * The CLI (`commands/config.ts`) and the MCP `config-set` tool both update a
+ * single preference from a raw string. They used to carry separate, drifting
+ * copies of the key tables and parse logic — the CLI was missing the SLM
+ * triage keys, the MCP side lacked the `scope` special case and the +/- array
+ * syntax. This module is the single source of truth both drive (#153).
+ */
+import type { ScoutPreferences } from "./schemas.js";
+export type FieldConfig = {
+    type: "array" | "number" | "float" | "boolean" | "string";
+} | {
+    type: "enum" | "enum-array";
+    validValues: readonly string[];
+};
+export declare const FIELD_CONFIGS: Record<string, FieldConfig>;
+/**
+ * Every configurable preference key, derived from the schema so a new
+ * preference can't be silently left unconfigurable. `assertFieldConfigsCover`
+ * (exercised by a unit test) fails loudly if FIELD_CONFIGS drifts from this.
+ */
+export declare const PREFERENCE_KEYS: readonly string[];
+/** Sorted key list for "unknown key" error messages and help text. */
+export declare const SORTED_PREFERENCE_KEYS: readonly string[];
+/**
+ * Throw if any schema preference lacks a FIELD_CONFIG entry. Called from a
+ * test so adding a preference to the schema without teaching config-set how to
+ * parse it is caught in CI rather than at a user's first `config set newKey`.
+ */
+export declare function assertFieldConfigsCover(): void;
+/**
+ * Apply an array update: plain set, +append, or -remove.
+ *
+ * The -remove form starts with a dash, which commander rejects as an unknown
+ * option unless escaped: `config set excludeRepos -- "-spam/repo"`. The MCP
+ * tool has no commander layer so it can pass `-spam/repo` directly. Documented
+ * in the CLI help and README (#132).
+ */
+export declare function updateArray(current: string[], value: string): string[];
+/**
+ * Apply a single key/value update to a preferences object and return the
+ * fully validated result. The raw string `value` is the form both the CLI and
+ * the MCP tool receive; arrays accept comma-separated values and the +add /
+ * -remove syntax. Throws ValidationError on an unknown key or a bad value.
+ */
+export declare function applyPreferenceField(preferences: ScoutPreferences, key: string, value: string): ScoutPreferences;

package/dist/core/preference-fields.js ADDED Viewed

@@ -0,0 +1,178 @@
+/**
+ * Shared preference-field metadata and value parsing.
+ *
+ * The CLI (`commands/config.ts`) and the MCP `config-set` tool both update a
+ * single preference from a raw string. They used to carry separate, drifting
+ * copies of the key tables and parse logic — the CLI was missing the SLM
+ * triage keys, the MCP side lacked the `scope` special case and the +/- array
+ * syntax. This module is the single source of truth both drive (#153).
+ */
+import { ScoutPreferencesSchema, IssueScopeSchema, ProjectCategorySchema, PersistenceModeSchema, SearchStrategySchema, } from "./schemas.js";
+import { ValidationError } from "./errors.js";
+export const FIELD_CONFIGS = {
+    githubUsername: { type: "string" },
+    languages: { type: "array" },
+    labels: { type: "array" },
+    scope: { type: "enum-array", validValues: IssueScopeSchema.options },
+    excludeRepos: { type: "array" },
+    excludeOrgs: { type: "array" },
+    aiPolicyBlocklist: { type: "array" },
+    projectCategories: {
+        type: "enum-array",
+        validValues: ProjectCategorySchema.options,
+    },
+    minStars: { type: "number" },
+    maxIssueAgeDays: { type: "number" },
+    includeDocIssues: { type: "boolean" },
+    minRepoScoreThreshold: { type: "number" },
+    interPhaseDelayMs: { type: "number" },
+    persistence: { type: "enum", validValues: PersistenceModeSchema.options },
+    defaultStrategy: {
+        type: "enum-array",
+        validValues: SearchStrategySchema.options,
+    },
+    broadPhaseDelayMs: { type: "number" },
+    skipBroadWhenSufficientResults: { type: "number" },
+    preferLanguages: { type: "array" },
+    preferRepos: { type: "array" },
+    diversityRatio: { type: "float" },
+    slmTriageModel: { type: "string" },
+    slmTriageHost: { type: "string" },
+    featuresAnchorThreshold: { type: "number" },
+    featuresSplitRatio: { type: "float" },
+};
+/**
+ * Every configurable preference key, derived from the schema so a new
+ * preference can't be silently left unconfigurable. `assertFieldConfigsCover`
+ * (exercised by a unit test) fails loudly if FIELD_CONFIGS drifts from this.
+ */
+export const PREFERENCE_KEYS = Object.keys(ScoutPreferencesSchema.shape);
+/** Sorted key list for "unknown key" error messages and help text. */
+export const SORTED_PREFERENCE_KEYS = [
+    ...PREFERENCE_KEYS,
+].sort();
+/**
+ * Throw if any schema preference lacks a FIELD_CONFIG entry. Called from a
+ * test so adding a preference to the schema without teaching config-set how to
+ * parse it is caught in CI rather than at a user's first `config set newKey`.
+ */
+export function assertFieldConfigsCover() {
+    const missing = PREFERENCE_KEYS.filter((k) => !(k in FIELD_CONFIGS));
+    if (missing.length > 0) {
+        throw new Error(`FIELD_CONFIGS is missing entries for preference keys: ${missing.join(", ")}`);
+    }
+    const extra = Object.keys(FIELD_CONFIGS).filter((k) => !PREFERENCE_KEYS.includes(k));
+    if (extra.length > 0) {
+        throw new Error(`FIELD_CONFIGS has entries for unknown preference keys: ${extra.join(", ")}`);
+    }
+}
+function parseBoolean(value) {
+    const lower = value.toLowerCase();
+    if (lower === "true" || lower === "yes")
+        return true;
+    if (lower === "false" || lower === "no")
+        return false;
+    throw new ValidationError(`Invalid boolean value: "${value}". Use true/false or yes/no.`);
+}
+function parseIntValue(value, key) {
+    const num = parseInt(value, 10);
+    if (isNaN(num)) {
+        throw new ValidationError(`Invalid number for "${key}": "${value}"`);
+    }
+    return num;
+}
+function parseFloatValue(value, key) {
+    const num = Number.parseFloat(value);
+    if (isNaN(num)) {
+        throw new ValidationError(`Invalid number for "${key}": "${value}"`);
+    }
+    return num;
+}
+function parseArrayValue(value) {
+    return value
+        .split(",")
+        .map((s) => s.trim())
+        .filter((s) => s.length > 0);
+}
+/**
+ * Apply an array update: plain set, +append, or -remove.
+ *
+ * The -remove form starts with a dash, which commander rejects as an unknown
+ * option unless escaped: `config set excludeRepos -- "-spam/repo"`. The MCP
+ * tool has no commander layer so it can pass `-spam/repo` directly. Documented
+ * in the CLI help and README (#132).
+ */
+export function updateArray(current, value) {
+    if (value.startsWith("+")) {
+        const toAdd = parseArrayValue(value.slice(1));
+        const merged = [...current];
+        for (const item of toAdd) {
+            if (!merged.includes(item))
+                merged.push(item);
+        }
+        return merged;
+    }
+    if (value.startsWith("-")) {
+        const toRemove = new Set(parseArrayValue(value.slice(1)));
+        return current.filter((item) => !toRemove.has(item));
+    }
+    return parseArrayValue(value);
+}
+/**
+ * Apply a single key/value update to a preferences object and return the
+ * fully validated result. The raw string `value` is the form both the CLI and
+ * the MCP tool receive; arrays accept comma-separated values and the +add /
+ * -remove syntax. Throws ValidationError on an unknown key or a bad value.
+ */
+export function applyPreferenceField(preferences, key, value) {
+    const field = FIELD_CONFIGS[key];
+    if (!field) {
+        throw new ValidationError(`Unknown config key: "${key}". Valid keys: ${SORTED_PREFERENCE_KEYS.join(", ")}`);
+    }
+    const prefs = { ...preferences };
+    switch (field.type) {
+        case "string":
+            prefs[key] = value;
+            break;
+        case "boolean":
+            prefs[key] = parseBoolean(value);
+            break;
+        case "number":
+            prefs[key] = parseIntValue(value, key);
+            break;
+        case "float":
+            prefs[key] = parseFloatValue(value, key);
+            break;
+        case "array": {
+            const current = prefs[key] ?? [];
+            prefs[key] = updateArray(current, value);
+            break;
+        }
+        case "enum": {
+            const validValues = field.validValues;
+            if (!validValues.includes(value)) {
+                throw new ValidationError(`Invalid value for "${key}": "${value}". Valid: ${validValues.join(", ")}`);
+            }
+            prefs[key] = value;
+            break;
+        }
+        case "enum-array": {
+            const current = prefs[key] ?? [];
+            const updated = updateArray(current, value);
+            const validValues = field.validValues;
+            const invalid = updated.filter((s) => !validValues.includes(s));
+            if (invalid.length > 0) {
+                throw new ValidationError(`Invalid value(s) for "${key}": ${invalid.join(", ")}. Valid: ${validValues.join(", ")}`);
+            }
+            // For 'scope', an empty array means undefined (all scopes).
+            if (key === "scope") {
+                prefs[key] = updated.length > 0 ? updated : undefined;
+            }
+            else {
+                prefs[key] = updated;
+            }
+            break;
+        }
+    }
+    return ScoutPreferencesSchema.parse(prefs);
+}

package/dist/core/repo-health.js CHANGED Viewed

@@ -5,7 +5,7 @@
  * from issue-level eligibility logic.
  */
 import { daysBetween } from "./utils.js";
-import { errorMessage, getHttpStatusCode, isRateLimitError } from "./errors.js";
+import { errorMessage, getHttpStatusCode, isRateLimitError, rethrowIfFatal, } from "./errors.js";
 import { warn } from "./logger.js";
 import { getHttpCache, cachedRequest, cachedTimeBased } from "./http-cache.js";
 const MODULE = "repo-health";
@@ -73,19 +73,14 @@ export async function checkProjectHealth(octokit, owner, repo) {
         });
     }
     catch (error) {
-        if (getHttpStatusCode(error) === 401 || isRateLimitError(error)) {
-            throw error;
-        }
+        rethrowIfFatal(error);
         const errMsg = errorMessage(error);
         warn(MODULE, `Error checking project health for ${owner}/${repo}: ${errMsg}`);
+        // The check failed: only the repo and the reason are known. The
+        // discriminated ProjectHealth type intentionally has no place for the
+        // neutral-default snapshot fields this used to fabricate (#158).
         return {
             repo: `${owner}/${repo}`,
-            lastCommitAt: "",
-            daysSinceLastCommit: 999,
-            openIssuesCount: 0,
-            avgIssueResponseDays: 0,
-            ciStatus: "unknown",
-            isActive: false,
             checkFailed: true,
             failureReason: errMsg,
         };
@@ -104,6 +99,22 @@ export async function fetchContributionGuidelines(octokit, owner, repo) {
     if (cached && Date.now() - cached.fetchedAt < CACHE_TTL_MS) {
         return cached.guidelines;
     }
+    // Concurrent vets of issues from one repo share a single probe (#124)
+    const inflight = guidelinesInflight.get(cacheKey);
+    if (inflight)
+        return inflight;
+    const promise = fetchContributionGuidelinesUncached(octokit, owner, repo);
+    guidelinesInflight.set(cacheKey, promise);
+    try {
+        return await promise;
+    }
+    finally {
+        guidelinesInflight.delete(cacheKey);
+    }
+}
+const guidelinesInflight = new Map();
+async function fetchContributionGuidelinesUncached(octokit, owner, repo) {
+    const cacheKey = `${owner}/${repo}`;
     const filesToCheck = [
         "CONTRIBUTING.md",
         ".github/CONTRIBUTING.md",
@@ -160,9 +171,13 @@ function parseContributionGuidelines(content) {
         rawContent: content,
     };
     const lowerContent = content.toLowerCase();
-    // Detect branch naming conventions
+    // Detect branch naming conventions. CONTRIBUTING.md is attacker-controlled
+    // (it belongs to the repo being vetted): the unbounded [^\n]* pair forced
+    // quadratic backtracking on a long quote-less line, stalling the vet
+    // (#152). Bounded quantifiers keep the scan linear-ish; real conventions
+    // sit well inside 200 chars of their keyword.
     if (lowerContent.includes("branch")) {
-        const branchMatch = content.match(/branch[^\n]*(?:named?|format|convention)[^\n]*[`"]([^`"]+)[`"]/i);
+        const branchMatch = content.match(/branch[^\n]{0,200}?(?:named?|format|convention)[^\n]{0,200}?[`"]([^`"\n]{1,100})[`"]/i);
         if (branchMatch) {
             guidelines.branchNamingConvention = branchMatch[1];
         }
@@ -172,7 +187,7 @@ function parseContributionGuidelines(content) {
         guidelines.commitMessageFormat = "conventional commits";
     }
     else if (lowerContent.includes("commit message")) {
-        const commitMatch = content.match(/commit message[^\n]*[`"]([^`"]+)[`"]/i);
+        const commitMatch = content.match(/commit message[^\n]{0,200}?[`"]([^`"\n]{1,100})[`"]/i);
         if (commitMatch) {
             guidelines.commitMessageFormat = commitMatch[1];
         }
@@ -193,8 +208,9 @@ function parseContributionGuidelines(content) {
         guidelines.linter = "RuboCop";
     else if (lowerContent.includes("prettier"))
         guidelines.formatter = "Prettier";
-    // Detect CLA requirement
-    if (lowerContent.includes("cla") ||
+    // Detect CLA requirement. Word boundary matters: a bare substring check
+    // matches "class", "clang", "clarify", etc. and flags nearly every doc.
+    if (/\bcla\b/.test(lowerContent) ||
         lowerContent.includes("contributor license agreement")) {
         guidelines.claRequired = true;
     }

package/dist/core/roadmap.js CHANGED Viewed

@@ -10,7 +10,7 @@
  * Auth (401) and rate-limit errors propagate, matching the rest of the
  * codebase's error strategy. Other errors degrade gracefully (warn + empty).
  */
-import { errorMessage, getHttpStatusCode, isRateLimitError } from "./errors.js";
+import { errorMessage, getHttpStatusCode, rethrowIfFatal } from "./errors.js";
 import { warn } from "./logger.js";
 const MODULE = "roadmap";
 /** TTL for roadmap fetch results (1 hour). */
@@ -97,6 +97,21 @@ export async function fetchRoadmapIssueRefs(octokit, owner, repo) {
     if (cached && Date.now() - cached.fetchedAt < CACHE_TTL_MS) {
         return cached.refs;
     }
+    // Concurrent feature vets of issues from one repo share a probe (#124)
+    const inflight = roadmapInflight.get(cacheKey);
+    if (inflight)
+        return inflight;
+    const promise = fetchRoadmapIssueRefsUncached(octokit, owner, repo, cacheKey);
+    roadmapInflight.set(cacheKey, promise);
+    try {
+        return await promise;
+    }
+    finally {
+        roadmapInflight.delete(cacheKey);
+    }
+}
+const roadmapInflight = new Map();
+async function fetchRoadmapIssueRefsUncached(octokit, owner, repo, cacheKey) {
     for (const path of ROADMAP_PATHS) {
         try {
             const { data } = await octokit.repos.getContent({ owner, repo, path });
@@ -109,8 +124,7 @@ export async function fetchRoadmapIssueRefs(octokit, owner, repo) {
             return refs;
         }
         catch (err) {
-            if (getHttpStatusCode(err) === 401 || isRateLimitError(err))
-                throw err;
+            rethrowIfFatal(err);
             const status = getHttpStatusCode(err);
             if (status === 404)
                 continue; // path missing — try next