npm - @adityanair98/api-oracle - Versions diffs - 0.5.0 - Mend

@adityanair98/api-oracle 0.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (119) hide show

package/LICENSE +21 -0
package/README.md +216 -0
package/dist/cli.d.ts +11 -0
package/dist/cli.js +74 -0
package/dist/dashboard/public/app.js +1004 -0
package/dist/dashboard/public/index.html +142 -0
package/dist/dashboard/public/public/app.js +1004 -0
package/dist/dashboard/public/public/index.html +142 -0
package/dist/dashboard/public/public/styles.css +1464 -0
package/dist/dashboard/public/styles.css +1464 -0
package/dist/dashboard/routes/api.d.ts +7 -0
package/dist/dashboard/routes/api.js +245 -0
package/dist/dashboard/server.d.ts +9 -0
package/dist/dashboard/server.js +45 -0
package/dist/index.d.ts +5 -0
package/dist/index.js +23 -0
package/dist/knowledge/db.d.ts +22 -0
package/dist/knowledge/db.js +182 -0
package/dist/knowledge/schema.d.ts +275 -0
package/dist/knowledge/schema.js +135 -0
package/dist/knowledge/scorer.d.ts +63 -0
package/dist/knowledge/scorer.js +314 -0
package/dist/knowledge/search.d.ts +37 -0
package/dist/knowledge/search.js +111 -0
package/dist/knowledge/synonyms.d.ts +36 -0
package/dist/knowledge/synonyms.js +523 -0
package/dist/knowledge/tfidf.d.ts +42 -0
package/dist/knowledge/tfidf.js +138 -0
package/dist/server.d.ts +9 -0
package/dist/server.js +40 -0
package/dist/tools/check-freshness.d.ts +9 -0
package/dist/tools/check-freshness.js +95 -0
package/dist/tools/compare-apis.d.ts +8 -0
package/dist/tools/compare-apis.js +149 -0
package/dist/tools/find-api.d.ts +9 -0
package/dist/tools/find-api.js +120 -0
package/dist/tools/get-setup-guide.d.ts +8 -0
package/dist/tools/get-setup-guide.js +127 -0
package/dist/updater/linter.d.ts +31 -0
package/dist/updater/linter.js +219 -0
package/dist/updater/report.d.ts +29 -0
package/dist/updater/report.js +96 -0
package/dist/updater/staleness.d.ts +39 -0
package/dist/updater/staleness.js +66 -0
package/dist/updater/version-tracker.d.ts +28 -0
package/dist/updater/version-tracker.js +50 -0
package/dist/utils/config.d.ts +11 -0
package/dist/utils/config.js +13 -0
package/dist/utils/logger.d.ts +20 -0
package/dist/utils/logger.js +32 -0
package/package.json +56 -0
package/src/entries/ai/anthropic.json +95 -0
package/src/entries/ai/eleven-labs.json +90 -0
package/src/entries/ai/openai.json +95 -0
package/src/entries/ai/replicate.json +87 -0
package/src/entries/ai/resemble-ai.json +88 -0
package/src/entries/ai/stability-ai.json +89 -0
package/src/entries/analytics/posthog.json +88 -0
package/src/entries/analytics/sentry.json +84 -0
package/src/entries/auth/auth0.json +90 -0
package/src/entries/auth/clerk.json +95 -0
package/src/entries/cms/contentful.json +92 -0
package/src/entries/cms/sanity.json +92 -0
package/src/entries/cms/strapi.json +93 -0
package/src/entries/commerce/medusa.json +91 -0
package/src/entries/commerce/shopify-api.json +91 -0
package/src/entries/communication/sendbird.json +85 -0
package/src/entries/communication/stream-chat.json +94 -0
package/src/entries/database/firebase.json +88 -0
package/src/entries/database/neon.json +94 -0
package/src/entries/database/planetscale.json +95 -0
package/src/entries/database/supabase.json +94 -0
package/src/entries/database/upstash.json +94 -0
package/src/entries/devops/fly-io.json +90 -0
package/src/entries/devops/netlify.json +90 -0
package/src/entries/devops/railway.json +90 -0
package/src/entries/devops/vercel.json +90 -0
package/src/entries/email/mailgun.json +91 -0
package/src/entries/email/postmark.json +91 -0
package/src/entries/email/resend.json +89 -0
package/src/entries/email/sendgrid.json +90 -0
package/src/entries/forms/formspark.json +85 -0
package/src/entries/forms/typeform.json +98 -0
package/src/entries/infrastructure/aws-s3.json +104 -0
package/src/entries/infrastructure/cloudflare-r2.json +92 -0
package/src/entries/infrastructure/cloudflare-workers.json +92 -0
package/src/entries/infrastructure/digital-ocean-spaces.json +87 -0
package/src/entries/integration/nango.json +90 -0
package/src/entries/integration/zapier.json +92 -0
package/src/entries/maps/google-maps.json +89 -0
package/src/entries/maps/mapbox.json +87 -0
package/src/entries/media/deepgram.json +84 -0
package/src/entries/media/imgix.json +84 -0
package/src/entries/media/mux.json +94 -0
package/src/entries/messaging/ably.json +94 -0
package/src/entries/messaging/pusher.json +94 -0
package/src/entries/messaging/twilio.json +94 -0
package/src/entries/messaging/vonage.json +89 -0
package/src/entries/notifications/knock.json +84 -0
package/src/entries/notifications/novu.json +84 -0
package/src/entries/notifications/onesignal.json +84 -0
package/src/entries/payments/lemonsqueezy.json +91 -0
package/src/entries/payments/paddle.json +90 -0
package/src/entries/payments/paypal.json +91 -0
package/src/entries/payments/razorpay.json +85 -0
package/src/entries/payments/square.json +91 -0
package/src/entries/payments/stripe.json +96 -0
package/src/entries/scheduling/cal-com.json +90 -0
package/src/entries/scheduling/calendly.json +90 -0
package/src/entries/search/algolia.json +96 -0
package/src/entries/security/arcjet.json +89 -0
package/src/entries/security/snyk.json +90 -0
package/src/entries/storage/cloudinary.json +93 -0
package/src/entries/storage/uploadthing.json +90 -0
package/src/entries/testing/browserstack.json +86 -0
package/src/entries/testing/checkly.json +89 -0
package/src/entries/workflow/inngest.json +88 -0
package/src/entries/workflow/temporal.json +90 -0
package/src/entries/workflow/trigger-dev.json +89 -0

package/dist/knowledge/scorer.js ADDED Viewed

@@ -0,0 +1,314 @@
+/**
+ * Scoring/ranking engine — ranks API entries by relevance to a task description.
+ * Uses weighted multi-factor scoring across 6 dimensions.
+ *
+ * Runtime exports: SCORING_WEIGHTS, DEFAULT_WEIGHTS, tokenize, scoreUseCaseFit,
+ *          scoreDevExperience, computeConfidence, confidenceLabel, scoreEntry,
+ *          rankEntries
+ * NOTE(review): ScoreWeights was listed here as an export but has no runtime
+ * counterpart in this compiled file — presumably a type-only export; confirm
+ * against scorer.d.ts.
+ */
+/**
+ * Default weights — must sum to exactly 1.0.
+ * Each key is the multiplier applied to the matching 0-1 sub-score in scoreEntry.
+ */
+export const SCORING_WEIGHTS = {
+    useCaseFit: 0.35,
+    qualityScore: 0.20,
+    developerExperience: 0.15,
+    pricingFit: 0.15,
+    keywordRelevance: 0.10,
+    recencyBonus: 0.05,
+};
+/**
+ * Alias for backwards compatibility.
+ * This is the same object reference as SCORING_WEIGHTS (not a copy), so a
+ * mutation made through either name is visible through both.
+ */
+export const DEFAULT_WEIGHTS = SCORING_WEIGHTS;
+// ─── Tokenizer ────────────────────────────────────────────────────────────────
+// Stop words that add noise without semantic value in the scoring context:
+// common English function words plus generic request words ("build", "add",
+// "make", "app", ...). Compared against already-lowercased tokens.
+const STOP_WORDS = new Set([
+    "the", "and", "for", "are", "but", "not", "you", "all",
+    "can", "her", "was", "one", "our", "out", "had", "has",
+    "with", "this", "that", "from", "they", "have", "been",
+    "more", "will", "when", "what", "your", "which", "how",
+    "any", "use", "get", "let", "its", "also", "want", "need",
+    "build", "add", "make", "app", "just",
+]);
+/**
+ * Normalize text to a set of lowercase tokens.
+ * Allows 2-char tokens (important for "ai", "db", "ml", "go").
+ *
+ * Steps: lowercase the text, replace every character that is not a-z, 0-9 or
+ * whitespace with a space, split on whitespace, then drop tokens shorter than
+ * two characters and tokens present in STOP_WORDS.
+ *
+ * @param text - Free-form text (a query, task, description, name, ...).
+ * @returns A Set of unique tokens; repeated words in the input collapse to one.
+ */
+export function tokenize(text) {
+    const tokens = text
+        .toLowerCase()
+        // Punctuation, hyphens and any non-ASCII characters act as separators.
+        .replace(/[^a-z0-9\s]/g, " ")
+        .split(/\s+/)
+        // The length check also discards the empty strings split() can produce.
+        .filter((t) => t.length >= 2 && !STOP_WORDS.has(t));
+    return new Set(tokens);
+}
+/**
+ * Compute Jaccard-like overlap score between two token sets.
+ *
+ * Unlike true Jaccard similarity, the shared-token count is divided by the
+ * size of the larger set rather than by the size of the union.
+ *
+ * @param a - First token set (iterated).
+ * @param b - Second token set (probed with has()).
+ * @returns A value in 0-1; 0 when either set is empty.
+ */
+function tokenOverlap(a, b) {
+    if (a.size === 0 || b.size === 0)
+        return 0;
+    let overlap = 0;
+    for (const token of a) {
+        if (b.has(token))
+            overlap++;
+    }
+    return overlap / Math.max(a.size, b.size);
+}
+// ─── Category Signals ─────────────────────────────────────────────────────────
+// Words whose presence in a query hints at a given entry category.
+const CATEGORY_SIGNALS = {
+    email: ["email", "mail", "smtp", "send", "transactional", "newsletter", "inbox", "bounce", "mailer"],
+    payments: ["payment", "pay", "checkout", "charge", "billing", "invoice", "subscription", "card", "upi", "merchant", "transaction"],
+    ai: ["ai", "ml", "llm", "gpt", "claude", "openai", "anthropic", "model", "completion", "embedding", "chatbot", "generate", "inference", "generative"],
+    storage: ["upload", "file", "image", "video", "media", "storage", "cdn", "asset", "photo", "bucket", "picture", "avatar"],
+    search: ["search", "query", "index", "algolia", "fulltext", "autocomplete", "facet", "filter", "typeahead"],
+    auth: ["auth", "authentication", "login", "signin", "signup", "oauth", "sso", "identity", "session", "token", "jwt", "credential"],
+    messaging: ["sms", "text", "message", "messaging", "phone", "call", "voice", "telephony", "twilio", "vonage"],
+    analytics: ["analytics", "tracking", "metrics", "event", "crash", "exception", "error", "monitoring", "observability", "posthog", "sentry"],
+    database: ["database", "db", "sql", "nosql", "postgres", "mysql", "query", "datastore", "backend", "persist"],
+    media: ["audio", "video", "stream", "transcribe", "transcode", "speech", "mux", "deepgram"],
+    notifications: ["notification", "push", "alert", "bell", "notify", "apns", "fcm"],
+    maps: ["map", "maps", "geo", "location", "address", "geocode", "navigation", "direction", "coordinate"],
+    communication: ["chat", "conversation", "channel", "room", "thread", "realtime", "websocket", "pusher", "ably"],
+};
+/**
+ * CATEGORY_SIGNALS as category → Set, built once at module load.
+ * A Map only exposes its own keys, so a category named like an inherited
+ * Object property (e.g. "constructor") is simply "unknown" instead of
+ * resolving to a function and crashing, and no Set is rebuilt per call.
+ */
+const CATEGORY_SIGNAL_SETS = new Map(Object.entries(CATEGORY_SIGNALS).map(([category, signals]) => [category, new Set(signals)]));
+/**
+ * Score how strongly the query tokens point at the given category.
+ *
+ * @param queryTokens - Set of query tokens (as produced by tokenize).
+ * @param category - Category name of the entry being scored.
+ * @returns matched-signal count / 3, capped at 1.0 (three or more matching
+ *          signal words give full score); 0 for a category without signals.
+ */
+function scoreCategoryMatch(queryTokens, category) {
+    const signalSet = CATEGORY_SIGNAL_SETS.get(category);
+    if (signalSet === undefined || signalSet.size === 0)
+        return 0;
+    let matched = 0;
+    for (const token of queryTokens) {
+        if (signalSet.has(token))
+            matched++;
+    }
+    return Math.min(matched / 3, 1.0);
+}
+// ─── 1. Use Case Fit (multi-field) ────────────────────────────────────────────
+// Multiplier applied to a use case's token overlap, keyed by its `fit` label.
+const FIT_WEIGHTS = {
+    perfect: 1.0,
+    good: 0.7,
+    partial: 0.4,
+};
+/**
+ * Score against multiple fields with weighted relevance:
+ * - Use case tasks (40%) — with fit multiplier, best match wins
+ * - bestFor (25%) — concise purpose statement
+ * - Description (20%) — first 200 chars (signal-dense)
+ * - Category signals (15%) — broad category alignment
+ *
+ * @param entry - API entry; reads useCases[].task, useCases[].fit, bestFor,
+ *                description and category.
+ * @param queryTokens - Set of query tokens (as produced by tokenize).
+ * @returns Combined score capped at 1.0; 0 when queryTokens is empty.
+ */
+export function scoreUseCaseFit(entry, queryTokens) {
+    if (queryTokens.size === 0)
+        return 0;
+    // Use case task matching
+    let bestUseCaseScore = 0;
+    for (const useCase of entry.useCases) {
+        const useCaseTokens = tokenize(useCase.task);
+        const overlap = tokenOverlap(queryTokens, useCaseTokens);
+        // A `fit` value missing from FIT_WEIGHTS makes this NaN, which never
+        // passes the `>` comparison below, so that use case is ignored.
+        const score = overlap * FIT_WEIGHTS[useCase.fit];
+        if (score > bestUseCaseScore)
+            bestUseCaseScore = score;
+    }
+    // bestFor
+    const bestForScore = tokenOverlap(queryTokens, tokenize(entry.bestFor));
+    // Description (first 200 chars)
+    const descScore = tokenOverlap(queryTokens, tokenize(entry.description.slice(0, 200)));
+    // Category match
+    const categoryScore = scoreCategoryMatch(queryTokens, entry.category);
+    return Math.min(bestUseCaseScore * 0.40 +
+        bestForScore * 0.25 +
+        descScore * 0.20 +
+        categoryScore * 0.15, 1.0);
+}
+// ─── 2. Quality Score ─────────────────────────────────────────────────────────
+/**
+ * Linearly rescale entry.qualityScore so that 1 maps to 0 and 10 maps to 1.
+ * No clamping is applied — assumes qualityScore is within 1-10; TODO confirm
+ * against the entry schema.
+ */
+function scoreQuality(entry) {
+    return (entry.qualityScore - 1) / 9;
+}
+// ─── 3. Developer Experience (sub-scored) ─────────────────────────────────────
+/**
+ * DX sub-scoring with measurable, explicit factors:
+ * - TypeScript as primary SDK: 3 pts (1.5 pts if only listed in otherLanguages)
+ * - 2+ code examples: 2 pts (1 pt for exactly one example)
+ * - envVarName defined (clear auth setup): 1 pt
+ * - Single npm install command: 1 pt
+ * - Multiple language SDKs (3+): 1 pt
+ * - Required language match: up to 2 pts (only when requiredLanguage is specified;
+ *   2 pts for the primary language, 1 pt for an entry in otherLanguages)
+ *
+ * Normalized to 0-1 range. Base max = 8 pts; with language constraint = 10 pts.
+ *
+ * @param entry - API entry; reads sdk.primaryLanguage, sdk.otherLanguages,
+ *                sdk.installCommand, codeExamples and auth.envVarName.
+ * @param constraints - Optional; only requiredLanguage is read here.
+ * @returns Earned points divided by the applicable maximum.
+ */
+export function scoreDevExperience(entry, constraints) {
+    let score = 0;
+    let maxScore = 8;
+    // TypeScript primary SDK (+3)
+    if (entry.sdk.primaryLanguage.toLowerCase() === "typescript") {
+        score += 3;
+    }
+    else if (entry.sdk.otherLanguages.some((l) => l.toLowerCase() === "typescript")) {
+        score += 1.5;
+    }
+    // 2+ code examples (+2)
+    if (entry.codeExamples.length >= 2) {
+        score += 2;
+    }
+    else if (entry.codeExamples.length === 1) {
+        score += 1;
+    }
+    // envVarName defined — clear auth setup (+1)
+    if (entry.auth.envVarName && entry.auth.envVarName.length > 0) {
+        score += 1;
+    }
+    // Single npm install command (+1)
+    // This is a plain substring check for "npm install"; it does not verify
+    // that the command is a single command.
+    if (entry.sdk.installCommand.includes("npm install")) {
+        score += 1;
+    }
+    // Multiple language SDKs (3+) (+1)
+    if (entry.sdk.otherLanguages.length >= 3) {
+        score += 1;
+    }
+    // Required language match (only when constraint specified; +2)
+    if (constraints?.requiredLanguage) {
+        // The denominator grows too, so a mismatch lowers the normalized score.
+        maxScore += 2;
+        const required = constraints.requiredLanguage.toLowerCase();
+        if (entry.sdk.primaryLanguage.toLowerCase() === required) {
+            score += 2;
+        }
+        else if (entry.sdk.otherLanguages.some((l) => l.toLowerCase() === required)) {
+            score += 1;
+        }
+    }
+    return score / maxScore;
+}
+// ─── 4. Pricing Fit ───────────────────────────────────────────────────────────
+/**
+ * Score how well the entry's pricing model suits the caller.
+ *
+ * With constraints.preferFree set: free/open_source 1.0, freemium with a
+ * non-null freeTier 0.85, usage_based 0.60, anything else 0.20.
+ * Without it: free/open_source 0.70, freemium 0.65, usage_based 0.60,
+ * anything else 0.50.
+ *
+ * @param entry - API entry; reads pricing.model and pricing.freeTier.
+ * @param constraints - Optional; only preferFree is read here.
+ * @returns One of the fixed scores listed above.
+ */
+function scorePricingFit(entry, constraints) {
+    if (constraints?.preferFree) {
+        // preferFree: generous free tier or open source scores highest
+        if (entry.pricing.model === "free" || entry.pricing.model === "open_source") {
+            return 1.0;
+        }
+        // A freemium entry whose freeTier is null falls through to 0.20 below.
+        if (entry.pricing.model === "freemium" && entry.pricing.freeTier !== null) {
+            return 0.85;
+        }
+        if (entry.pricing.model === "usage_based") {
+            return 0.60; // Can be free at low usage
+        }
+        return 0.20; // Paid-only is a poor match
+    }
+    // No pricing constraint — slight boost for easy-to-start options
+    if (entry.pricing.model === "free" || entry.pricing.model === "open_source") {
+        return 0.70;
+    }
+    if (entry.pricing.model === "freemium") {
+        return 0.65;
+    }
+    if (entry.pricing.model === "usage_based") {
+        return 0.60;
+    }
+    return 0.50; // Paid — neutral
+}
+// ─── 5. Keyword Relevance ─────────────────────────────────────────────────────
+/**
+ * Direct keyword relevance: checks if query tokens appear in name/slug/subcategory.
+ * This rewards exact API name matches ("algolia" for search queries, "stripe" for payments).
+ *
+ * @param entry - API entry; reads name, slug and subcategory.
+ * @param queryTokens - Set of query tokens (as produced by tokenize).
+ * @returns 0.5 * name overlap + 0.3 * slug overlap + 0.2 * subcategory
+ *          overlap, capped at 1.0.
+ */
+function scoreKeywordRelevance(entry, queryTokens) {
+    const nameTokens = tokenize(entry.name);
+    // Hyphens are turned into spaces before tokenizing so each slug /
+    // subcategory segment becomes its own token.
+    const slugTokens = tokenize(entry.slug.replace(/-/g, " "));
+    const subCatTokens = tokenize(entry.subcategory.replace(/-/g, " "));
+    // Boost when API name or slug appears in query (user named the tool directly)
+    const nameMatch = tokenOverlap(queryTokens, nameTokens);
+    const slugMatch = tokenOverlap(queryTokens, slugTokens);
+    const subCatMatch = tokenOverlap(queryTokens, subCatTokens);
+    // Name match is strongest signal (user asked for "stripe" or "algolia" by name)
+    return Math.min(nameMatch * 0.5 + slugMatch * 0.3 + subCatMatch * 0.2, 1.0);
+}
+// ─── 6. Recency Bonus ─────────────────────────────────────────────────────────
+const MS_PER_DAY = 86_400_000;
+/**
+ * Recency bonus: entries verified within 30 days score 1.0.
+ * Scales linearly to 0 at 365 days. Older entries score 0.
+ *
+ * The current time is read on every call instead of being captured once at
+ * module load, so ages stay correct however long the process has been running.
+ * A lastVerified date in the future counts as "within 30 days" and scores 1.0.
+ *
+ * @param entry - API entry; reads lastVerified (anything `new Date()` accepts).
+ * @returns A value in 0-1; 0 when lastVerified is missing or unparseable.
+ */
+function scoreRecency(entry) {
+    try {
+        const verifiedMs = new Date(entry.lastVerified).getTime();
+        // new Date() does not throw on unparseable input — it yields NaN.
+        if (Number.isNaN(verifiedMs))
+            return 0;
+        const daysOld = (Date.now() - verifiedMs) / MS_PER_DAY;
+        if (daysOld <= 30)
+            return 1.0;
+        if (daysOld <= 365)
+            return 1.0 - (daysOld - 30) / 335;
+        return 0;
+    }
+    catch {
+        // Best-effort: a missing entry or a value Date cannot coerce scores 0.
+        return 0;
+    }
+}
+// ─── Category Boost ───────────────────────────────────────────────────────────
+/**
+ * Multiply the score of entries whose category equals the detected category.
+ *
+ * @param score - Base score before the boost.
+ * @param entry - API entry; reads category.
+ * @param detectedCategory - Category detected for the query, or null/empty.
+ * @param detectedConfidence - Detection confidence; below 0.4 no boost is applied.
+ * @returns score * (1 + detectedConfidence * 0.12), capped at 1.0, for a
+ *          matching entry; otherwise the score unchanged.
+ */
+function applyCategoryBoost(score, entry, detectedCategory, detectedConfidence) {
+    if (!detectedCategory || detectedConfidence < 0.4)
+        return score;
+    if (entry.category === detectedCategory) {
+        const boost = detectedConfidence * 0.12; // Up to 12% boost
+        return Math.min(score * (1 + boost), 1.0);
+    }
+    return score;
+}
+// ─── Confidence Score ─────────────────────────────────────────────────────────
+/**
+ * Compute a confidence value (0-1) for how certain we are about the top result.
+ *
+ * Three signals are blended:
+ * - useCaseFit quality (40%) — full signal once useCaseFit reaches 0.5
+ * - category detection confidence (35%) — 0 when no category was detected
+ * - score separation from the runner-up (25%) — a gap of 0.2 or more is full
+ *   signal; 0.5 is used when there is no runner-up
+ *
+ * confidenceLabel() maps the value to a label: >= 0.7 "high", >= 0.4
+ * "medium", otherwise "low".
+ *
+ * @param topResult - Result being assessed; reads score and scoreBreakdown.useCaseFit.
+ * @param detectedCategory - Category detected for the query, or null.
+ * @param detectedConfidence - Confidence of that detection.
+ * @param allResults - Ranked results; element [1] is treated as the runner-up.
+ * @returns Confidence rounded to two decimals, always within 0-1.
+ */
+export function computeConfidence(topResult, detectedCategory, detectedConfidence, allResults) {
+    const useCaseFit = topResult.scoreBreakdown["useCaseFit"] ?? 0;
+    const totalScore = topResult.score;
+    // Factor 1: useCaseFit raw score quality
+    const fitSignal = Math.min(useCaseFit / 0.5, 1.0); // 0.5+ useCaseFit → full signal
+    // Factor 2: category detection confidence
+    const catSignal = detectedCategory ? detectedConfidence : 0;
+    // Factor 3: score separation (top result vs runner-up)
+    // Clamped at 0 as well as 1: if the list is not sorted best-first the gap
+    // is negative, which must not drag the result below the documented range.
+    const separation = allResults.length >= 2
+        ? Math.max(0, Math.min((totalScore - allResults[1].score) * 5, 1.0))
+        : 0.5;
+    // Weighted combination
+    const raw = fitSignal * 0.40 + catSignal * 0.35 + separation * 0.25;
+    return Math.round(Math.max(0, Math.min(raw, 1.0)) * 100) / 100;
+}
+/**
+ * Human-readable confidence label.
+ *
+ * @param confidence - Numeric confidence value.
+ * @returns "high" for >= 0.7, "medium" for >= 0.4, otherwise "low".
+ */
+export function confidenceLabel(confidence) {
+    if (confidence >= 0.7)
+        return "high";
+    if (confidence >= 0.4)
+        return "medium";
+    return "low";
+}
+// ─── Main Scoring Function ────────────────────────────────────────────────────
+/**
+ * Score a single entry against a query across all six dimensions.
+ *
+ * @param entry - API entry to score.
+ * @param query - Raw query text; only used when context.expandedQuery is absent.
+ * @param constraints - Optional preferences forwarded to the developer
+ *                      experience and pricing sub-scores.
+ * @param weights - Per-dimension weights; defaults to SCORING_WEIGHTS.
+ * @param context - Optional; reads expandedQuery, detectedCategory and
+ *                  detectedConfidence.
+ * @returns { entry, score, scoreBreakdown } — score is the unrounded total
+ *          after the category boost; scoreBreakdown holds each raw sub-score
+ *          and the total, rounded to two decimals.
+ */
+export function scoreEntry(entry, query, constraints, weights = SCORING_WEIGHTS, context) {
+    // Prefer the synonym-expanded query when the caller supplied one.
+    const effectiveQuery = context?.expandedQuery ?? query;
+    const queryTokens = tokenize(effectiveQuery);
+    const useCaseFitRaw = scoreUseCaseFit(entry, queryTokens);
+    const qualityRaw = scoreQuality(entry);
+    const devExperienceRaw = scoreDevExperience(entry, constraints);
+    const pricingFitRaw = scorePricingFit(entry, constraints);
+    const keywordRelevanceRaw = scoreKeywordRelevance(entry, queryTokens);
+    const recencyRaw = scoreRecency(entry);
+    // Weighted sum of the six raw sub-scores.
+    const baseScore = useCaseFitRaw * weights.useCaseFit +
+        qualityRaw * weights.qualityScore +
+        devExperienceRaw * weights.developerExperience +
+        pricingFitRaw * weights.pricingFit +
+        keywordRelevanceRaw * weights.keywordRelevance +
+        recencyRaw * weights.recencyBonus;
+    // Without context the boost is a no-op (null category, confidence 0).
+    const totalScore = applyCategoryBoost(baseScore, entry, context?.detectedCategory ?? null, context?.detectedConfidence ?? 0);
+    const scoreBreakdown = {
+        useCaseFit: Math.round(useCaseFitRaw * 100) / 100,
+        qualityScore: Math.round(qualityRaw * 100) / 100,
+        developerExperience: Math.round(devExperienceRaw * 100) / 100,
+        pricingFit: Math.round(pricingFitRaw * 100) / 100,
+        keywordRelevance: Math.round(keywordRelevanceRaw * 100) / 100,
+        recencyBonus: Math.round(recencyRaw * 100) / 100,
+        total: Math.round(totalScore * 100) / 100,
+    };
+    return { entry, score: totalScore, scoreBreakdown };
+}
+// ─── Ranking Function ─────────────────────────────────────────────────────────
+/**
+ * Score every entry and return the best ones.
+ *
+ * @param entries - Candidate entries; the input array itself is not reordered
+ *                  (sorting happens on the freshly mapped result array).
+ * @param query - Raw query text, forwarded to scoreEntry.
+ * @param constraints - Optional preferences, forwarded to scoreEntry.
+ * @param topN - Number of results to keep; defaults to 3.
+ * @param weights - Per-dimension weights; defaults to SCORING_WEIGHTS.
+ * @param context - Optional scoring context, forwarded to scoreEntry.
+ * @returns The first topN scored results, highest score first; [] for no entries.
+ */
+export function rankEntries(entries, query, constraints, topN = 3, weights = SCORING_WEIGHTS, context) {
+    if (entries.length === 0)
+        return [];
+    const scored = entries.map((entry) => scoreEntry(entry, query, constraints, weights, context));
+    scored.sort((a, b) => b.score - a.score);
+    return scored.slice(0, topN);
+}

package/dist/knowledge/search.d.ts ADDED Viewed

@@ -0,0 +1,37 @@
+/**
+ * Search layer — combines a TF-IDF candidate search over the stored entries
+ * with the scoring engine.
+ * Uses synonym expansion and category detection to improve result quality.
+ *
+ * Exports: SearchConstraints, RankedResult, findApis, getApiBySlug, getApisByCategory
+ */
+import type { ApiEntry } from "./schema.js";
+/** Optional caller preferences that influence ranking. */
+export interface SearchConstraints {
+    /** NOTE(review): not read by the scorer/search code shipped alongside this declaration — confirm where it is consumed. */
+    maxPrice?: string;
+    /** Language the SDK should support; compared case-insensitively against the entry's SDK languages. */
+    requiredLanguage?: string;
+    /** Favor free / open-source / freemium options; when omitted, findApis falls back to what it detects in the query text. */
+    preferFree?: boolean;
+}
+/** One scored entry as returned by findApis. */
+export interface RankedResult {
+    entry: ApiEntry;
+    /** Total score after the category boost (unrounded). */
+    score: number;
+    /** Per-dimension sub-scores plus "total", each rounded to two decimals. */
+    scoreBreakdown: Record<string, number>;
+    /** Confidence in this recommendation (0-1); only set on the top result */
+    confidence?: number;
+    /** Human-readable confidence label: "high" | "medium" | "low" */
+    confidenceLabel?: "high" | "medium" | "low";
+}
+/**
+ * Find and rank APIs for a given task description.
+ *
+ * Pipeline:
+ * 1. Detect phrases in the query — a detected preferFree is used when the
+ *    caller did not set one
+ * 2. Expand query with synonyms
+ * 3. Detect category for scoring boost
+ * 4. Build the candidate pool: TF-IDF search on the expanded query, plus all
+ *    entries of the detected category (confidence >= 0.4), plus every
+ *    remaining entry when fewer than topN candidates were found
+ * 5. Rank all candidates with scorer using expanded query + context
+ * 6. Attach confidence / confidenceLabel to the top result
+ *
+ * @param query - Task description; an empty or whitespace-only query returns [].
+ * @param constraints - Optional ranking preferences.
+ * @param topN - Maximum number of results (the implementation defaults to 3).
+ * @returns Up to topN results, highest score first.
+ */
+export declare function findApis(query: string, constraints?: SearchConstraints, topN?: number): RankedResult[];
+/** Get a single API entry by its slug */
+export declare function getApiBySlug(slug: string): ApiEntry | null;
+/** Get all APIs in a category, ranked by quality score */
+export declare function getApisByCategory(category: string): ApiEntry[];

package/dist/knowledge/search.js ADDED Viewed

@@ -0,0 +1,111 @@
+/**
+ * Search layer — combines SQLite text search with the scoring engine.
+ * Uses synonym expansion and category detection to improve result quality.
+ *
+ * Exports: SearchConstraints, RankedResult, findApis, getApiBySlug, getApisByCategory
+ */
+import { getAllEntries, getBySlug, getByCategory } from "./db.js";
+import { rankEntries, computeConfidence, confidenceLabel } from "./scorer.js";
+import { expandQuery, detectCategory, detectPhrases } from "./synonyms.js";
+import { getTfIdfEngine } from "./tfidf.js";
+import { createLogger } from "../utils/logger.js";
+const logger = createLogger("search");
+/**
+ * Find and rank APIs for a given task description.
+ *
+ * Pipeline:
+ * 1. Detect phrases in the query — a detected preferFree is used when the
+ *    caller did not set one
+ * 2. Expand query with synonyms
+ * 3. Detect category for scoring boost
+ * 4. Build the candidate pool: TF-IDF search on the expanded query, plus all
+ *    entries of the detected category (confidence >= 0.4), plus every
+ *    remaining entry when fewer than topN candidates were found
+ * 5. Rank all candidates with scorer using expanded query + context
+ * 6. Attach confidence / confidenceLabel to the top result
+ *
+ * @param query - Task description; an empty or whitespace-only query returns [].
+ * @param constraints - Optional ranking preferences.
+ * @param topN - Maximum number of results to return; defaults to 3.
+ * @returns Up to topN ranked results, highest score first.
+ */
+export function findApis(query, constraints, topN = 3) {
+    logger.debug("findApis called", { query, constraints, topN });
+    if (!query || query.trim().length === 0) {
+        logger.warn("Empty query provided to findApis");
+        return [];
+    }
+    const trimmedQuery = query.trim();
+    // Step 1: Phrase detection — auto-apply preferFree from query language
+    const phrases = detectPhrases(trimmedQuery);
+    const effectiveConstraints = {
+        ...constraints,
+        // An explicit caller value (including false) wins over detection.
+        preferFree: constraints?.preferFree ?? phrases.preferFree,
+    };
+    // Step 2: Synonym expansion
+    const expandedQuery = expandQuery(trimmedQuery);
+    logger.debug("Query expanded", {
+        original: trimmedQuery,
+        expanded: expandedQuery.length > trimmedQuery.length
+            ? `${expandedQuery.slice(0, 80)}...`
+            : "unchanged",
+    });
+    // Step 3: Category detection for scoring context
+    const { category: detectedCategory, confidence: detectedConfidence } = detectCategory(trimmedQuery);
+    logger.debug("Category detected", { detectedCategory, detectedConfidence });
+    const scoringContext = {
+        expandedQuery,
+        detectedCategory,
+        detectedConfidence,
+    };
+    // Step 4: Build candidate pool via TF-IDF index
+    // Lazily build the index from all entries on first call
+    const all = getAllEntries();
+    const engine = getTfIdfEngine();
+    if (!engine.isBuilt) {
+        engine.build(all);
+        logger.debug("TF-IDF index built", { entryCount: engine.size });
+    }
+    // TF-IDF search on expanded query (broader recall than LIKE)
+    const tfIdfCandidates = engine.search(expandedQuery, topN * 8);
+    // Work on a copy: the returned array belongs to the TF-IDF engine, and
+    // pushing extra candidates into it would leak them into whatever the
+    // engine keeps or hands out elsewhere.
+    const candidates = [...tfIdfCandidates];
+    const seenSlugs = new Set(candidates.map((e) => e.slug));
+    // Also include all entries in the detected category (high-signal candidates)
+    if (detectedCategory && detectedConfidence >= 0.4) {
+        const categoryEntries = getByCategory(detectedCategory);
+        for (const entry of categoryEntries) {
+            if (!seenSlugs.has(entry.slug)) {
+                candidates.push(entry);
+                seenSlugs.add(entry.slug);
+            }
+        }
+    }
+    // Safety net: if still fewer candidates than requested, add remaining entries
+    if (candidates.length < topN) {
+        logger.debug("Broadening to all entries — too few TF-IDF candidates", {
+            candidateCount: candidates.length,
+        });
+        for (const entry of all) {
+            if (!seenSlugs.has(entry.slug)) {
+                candidates.push(entry);
+                seenSlugs.add(entry.slug);
+            }
+        }
+    }
+    // Step 5: Rank with scorer using expanded query + context
+    // (the expanded query reaches the scorer through scoringContext)
+    const results = rankEntries(candidates, trimmedQuery, effectiveConstraints, topN, undefined, scoringContext);
+    // Step 6: Attach confidence to top result
+    if (results.length > 0 && results[0]) {
+        const conf = computeConfidence(results[0], detectedCategory, detectedConfidence, results);
+        results[0].confidence = conf;
+        results[0].confidenceLabel = confidenceLabel(conf);
+    }
+    logger.debug("findApis results", {
+        candidateCount: candidates.length,
+        resultCount: results.length,
+        topSlug: results[0]?.entry.slug,
+        confidence: results[0]?.confidence,
+        detectedCategory,
+    });
+    return results;
+}
+/**
+ * Get a single API entry by its slug.
+ * Thin wrapper that returns whatever getBySlug (db.js) returns for the slug.
+ */
+export function getApiBySlug(slug) {
+    return getBySlug(slug);
+}
+/**
+ * Get all APIs in a category, ranked by quality score.
+ * Thin wrapper around getByCategory (db.js); no sorting happens here.
+ * NOTE(review): the quality-score ordering is presumably applied inside
+ * getByCategory — confirm in db.js.
+ */
+export function getApisByCategory(category) {
+    return getByCategory(category);
+}

package/dist/knowledge/synonyms.d.ts ADDED Viewed

@@ -0,0 +1,36 @@
+/**
+ * Synonym expansion, phrase detection, and category detection for query processing.
+ *
+ * Exports:
+ *   SYNONYM_GROUPS      — raw synonym groups for testing
+ *   expandQuery         — expands a query with synonyms
+ *   detectPhrases       — extracts modifier intent from a query
+ *   detectCategory      — maps a query to a known category with confidence
+ */
+/** Raw synonym groups; each inner array is one group of terms. */
+export declare const SYNONYM_GROUPS: readonly string[][];
+/**
+ * Expand a query by adding synonyms for any terms it contains.
+ * Example: "log in with Google" → "log in with Google auth authentication
+ *           login signin signup register sso oauth identity..."
+ */
+export declare function expandQuery(query: string): string;
+/**
+ * Modifier intent extracted from a query.
+ * Of these fields, findApis (search.js) reads only preferFree.
+ */
+export interface PhraseModifiers {
+    /** User wants free or cheap options */
+    preferFree: boolean;
+    /** User wants open-source or self-hostable options */
+    preferOpenSource: boolean;
+    /** User emphasizes reliability / production-grade */
+    preferReliable: boolean;
+    /** Serverless / edge / Vercel context */
+    preferServerless: boolean;
+    /** Reference to another API ("like Firebase but...") */
+    referenceSlug: string | null;
+}
+/** Extract modifier intent from a query */
+export declare function detectPhrases(query: string): PhraseModifiers;
+/** Result of category detection. */
+export interface CategoryMatch {
+    /** Detected category name; presumably null when nothing matched — confirm in synonyms.js. */
+    category: string | null;
+    /** Detection confidence; findApis and the scorer only act on the category when this is >= 0.4. */
+    confidence: number;
+}
+/** Detect the most likely category for a query, with a confidence score */
+export declare function detectCategory(query: string): CategoryMatch;