npm - @ansvar/us-regulations-mcp - Versions diffs - 1.0.0 - Mend

@ansvar/us-regulations-mcp 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (89) hide show

package/LICENSE +190 -0
package/README.md +275 -0
package/data/.gitkeep +0 -0
package/data/regulations.db +0 -0
package/data/seed/applicability/rules.json +74 -0
package/data/seed/mappings/ccpa-nist-csf.json +144 -0
package/data/seed/mappings/hipaa-nist-800-53.json +377 -0
package/dist/index.d.ts +3 -0
package/dist/index.d.ts.map +1 -0
package/dist/index.js +41 -0
package/dist/index.js.map +1 -0
package/dist/ingest/adapters/california-leginfo.d.ts +72 -0
package/dist/ingest/adapters/california-leginfo.d.ts.map +1 -0
package/dist/ingest/adapters/california-leginfo.js +270 -0
package/dist/ingest/adapters/california-leginfo.js.map +1 -0
package/dist/ingest/adapters/ecfr.d.ts +76 -0
package/dist/ingest/adapters/ecfr.d.ts.map +1 -0
package/dist/ingest/adapters/ecfr.js +355 -0
package/dist/ingest/adapters/ecfr.js.map +1 -0
package/dist/ingest/adapters/regulations-gov.d.ts +47 -0
package/dist/ingest/adapters/regulations-gov.d.ts.map +1 -0
package/dist/ingest/adapters/regulations-gov.js +91 -0
package/dist/ingest/adapters/regulations-gov.js.map +1 -0
package/dist/ingest/framework.d.ts +84 -0
package/dist/ingest/framework.d.ts.map +1 -0
package/dist/ingest/framework.js +8 -0
package/dist/ingest/framework.js.map +1 -0
package/dist/tools/action-items.d.ts +23 -0
package/dist/tools/action-items.d.ts.map +1 -0
package/dist/tools/action-items.js +118 -0
package/dist/tools/action-items.js.map +1 -0
package/dist/tools/applicability.d.ts +26 -0
package/dist/tools/applicability.d.ts.map +1 -0
package/dist/tools/applicability.js +49 -0
package/dist/tools/applicability.js.map +1 -0
package/dist/tools/compare.d.ts +20 -0
package/dist/tools/compare.d.ts.map +1 -0
package/dist/tools/compare.js +35 -0
package/dist/tools/compare.js.map +1 -0
package/dist/tools/definitions.d.ts +22 -0
package/dist/tools/definitions.d.ts.map +1 -0
package/dist/tools/definitions.js +43 -0
package/dist/tools/definitions.js.map +1 -0
package/dist/tools/evidence.d.ts +23 -0
package/dist/tools/evidence.d.ts.map +1 -0
package/dist/tools/evidence.js +27 -0
package/dist/tools/evidence.js.map +1 -0
package/dist/tools/list.d.ts +25 -0
package/dist/tools/list.d.ts.map +1 -0
package/dist/tools/list.js +66 -0
package/dist/tools/list.js.map +1 -0
package/dist/tools/map.d.ts +26 -0
package/dist/tools/map.d.ts.map +1 -0
package/dist/tools/map.js +58 -0
package/dist/tools/map.js.map +1 -0
package/dist/tools/registry.d.ts +19 -0
package/dist/tools/registry.d.ts.map +1 -0
package/dist/tools/registry.js +260 -0
package/dist/tools/registry.js.map +1 -0
package/dist/tools/search.d.ts +15 -0
package/dist/tools/search.d.ts.map +1 -0
package/dist/tools/search.js +94 -0
package/dist/tools/search.js.map +1 -0
package/dist/tools/section.d.ts +19 -0
package/dist/tools/section.d.ts.map +1 -0
package/dist/tools/section.js +50 -0
package/dist/tools/section.js.map +1 -0
package/package.json +76 -0
package/scripts/build-db.ts +268 -0
package/scripts/ingest.ts +214 -0
package/scripts/load-seed-data.ts +133 -0
package/scripts/quality-test.ts +346 -0
package/scripts/test-mcp-tools.ts +187 -0
package/scripts/test-remaining-tools.ts +107 -0
package/src/index.ts +55 -0
package/src/ingest/adapters/california-leginfo.ts +322 -0
package/src/ingest/adapters/ecfr.ts +403 -0
package/src/ingest/adapters/regulations-gov.ts +112 -0
package/src/ingest/framework.ts +92 -0
package/src/tools/action-items.ts +164 -0
package/src/tools/applicability.ts +91 -0
package/src/tools/compare.ts +61 -0
package/src/tools/definitions.ts +79 -0
package/src/tools/evidence.ts +53 -0
package/src/tools/list.ts +120 -0
package/src/tools/map.ts +100 -0
package/src/tools/registry.ts +275 -0
package/src/tools/search.ts +132 -0
package/src/tools/section.ts +85 -0

package/src/tools/registry.ts ADDED Viewed

@@ -0,0 +1,275 @@
+import { Server } from '@modelcontextprotocol/sdk/server/index.js';
+import {
+  CallToolRequestSchema,
+  ListToolsRequestSchema,
+} from '@modelcontextprotocol/sdk/types.js';
+import Database from 'better-sqlite3';
+import { searchRegulations, SearchInput } from './search.js';
+import { getSection, GetSectionInput } from './section.js';
+import { listRegulations, ListInput } from './list.js';
+import { compareRequirements, CompareInput } from './compare.js';
+import { mapControls, MapControlsInput } from './map.js';
+import { checkApplicability, ApplicabilityInput } from './applicability.js';
+import { getDefinitions, DefinitionsInput } from './definitions.js';
+import { getEvidenceRequirements, EvidenceInput } from './evidence.js';
+import { getComplianceActionItems, ActionItemsInput } from './action-items.js';
+/**
+ * Describes a single MCP tool: the metadata advertised to clients plus the
+ * function that executes the tool.
+ */
+export interface ToolDefinition {
+  /** Tool name; incoming tool-call requests are matched against this value. */
+  name: string;
+  /** Human-readable description returned in the tool listing. */
+  description: string;
+  /** Schema object describing the tool's arguments; returned as-is in the tool listing. */
+  inputSchema: any;
+  /** Runs the tool against the given database handle with the caller-supplied arguments. */
+  handler: (db: Database.Database, args: any) => Promise<any>;
+}
+/**
+ * Central catalogue of every MCP tool exposed by this package.
+ * Both the stdio and HTTP servers read from this one list so they cannot drift apart.
+ *
+ * Each handler is a thin adapter: it casts the untyped request arguments to the
+ * tool's input type and delegates to the implementing function.
+ */
+export const TOOLS: ToolDefinition[] = [
+  // Full-text search
+  {
+    name: 'search_regulations',
+    description: 'Search across all US regulations using full-text search. Returns relevant sections with highlighted snippets. Token-efficient: returns 32-token snippets with >>> <<< markers around matched terms.',
+    inputSchema: {
+      type: 'object',
+      properties: {
+        query: {
+          type: 'string',
+          description: 'Search query (supports natural language and technical terms)',
+        },
+        regulations: {
+          type: 'array',
+          items: { type: 'string' },
+          description: 'Optional: Filter results to specific regulations (e.g., ["HIPAA", "CCPA"])',
+        },
+        limit: {
+          type: 'number',
+          description: 'Maximum number of results to return (default: 10, max: 1000)',
+          default: 10,
+        },
+      },
+      required: ['query'],
+    },
+    handler: async (db, args) => searchRegulations(db, args as SearchInput),
+  },
+  // Single-section retrieval
+  {
+    name: 'get_section',
+    description: 'Retrieve the full text of a specific regulation section. Returns section content, metadata, and cross-references. Large sections are automatically truncated with a warning.',
+    inputSchema: {
+      type: 'object',
+      properties: {
+        regulation: {
+          type: 'string',
+          description: 'Regulation ID (e.g., "HIPAA", "CCPA")',
+        },
+        section: {
+          type: 'string',
+          description: 'Section number (e.g., "164.502", "1798.100")',
+        },
+      },
+      required: ['regulation', 'section'],
+    },
+    handler: async (db, args) => getSection(db, args as GetSectionInput),
+  },
+  // Regulation catalogue / structure
+  {
+    name: 'list_regulations',
+    description: 'List all available regulations or get the structure of a specific regulation. Without parameters, returns all regulations with metadata. With a regulation ID, returns chapters and sections organized hierarchically.',
+    inputSchema: {
+      type: 'object',
+      properties: {
+        regulation: {
+          type: 'string',
+          description: 'Optional: Regulation ID to get detailed structure for (e.g., "HIPAA")',
+        },
+      },
+    },
+    handler: async (db, args) => listRegulations(db, args as ListInput),
+  },
+  // Cross-regulation comparison
+  {
+    name: 'compare_requirements',
+    description: 'Compare requirements across multiple regulations for a specific topic. Searches each regulation and returns the top matching sections with relevance scores.',
+    inputSchema: {
+      type: 'object',
+      properties: {
+        topic: {
+          type: 'string',
+          description: 'Topic to compare (e.g., "breach notification", "access controls")',
+        },
+        regulations: {
+          type: 'array',
+          items: { type: 'string' },
+          description: 'List of regulations to compare (e.g., ["HIPAA", "CCPA"])',
+        },
+      },
+      required: ['topic', 'regulations'],
+    },
+    handler: async (db, args) => compareRequirements(db, args as CompareInput),
+  },
+  // Control-framework mapping
+  {
+    name: 'map_controls',
+    description: 'Map NIST controls (800-53, CSF) to regulation sections. Shows which regulatory requirements satisfy specific control objectives. Can filter by control ID or regulation.',
+    inputSchema: {
+      type: 'object',
+      properties: {
+        framework: {
+          type: 'string',
+          description: 'Control framework (e.g., "NIST_CSF", "NIST_800_53", "ISO27001")',
+        },
+        control: {
+          type: 'string',
+          description: 'Optional: Specific control ID (e.g., "AC-1", "PR.AC-1")',
+        },
+        regulation: {
+          type: 'string',
+          description: 'Optional: Filter to specific regulation (e.g., "HIPAA")',
+        },
+      },
+      required: ['framework'],
+    },
+    handler: async (db, args) => mapControls(db, args as MapControlsInput),
+  },
+  // Sector applicability
+  {
+    name: 'check_applicability',
+    description: 'Determine which regulations apply to a specific sector or subsector. Returns applicable regulations with confidence levels (definite, likely, possible).',
+    inputSchema: {
+      type: 'object',
+      properties: {
+        sector: {
+          type: 'string',
+          description: 'Industry sector (e.g., "healthcare", "financial", "retail", "technology")',
+        },
+        subsector: {
+          type: 'string',
+          description: 'Optional: Specific subsector (e.g., "hospital", "bank", "e-commerce")',
+        },
+      },
+      required: ['sector'],
+    },
+    handler: async (db, args) => checkApplicability(db, args as ApplicabilityInput),
+  },
+  // Term definitions
+  {
+    name: 'get_definitions',
+    description: 'Look up official term definitions across regulations. Uses partial matching to find terms (e.g., "health" matches "protected health information").',
+    inputSchema: {
+      type: 'object',
+      properties: {
+        term: {
+          type: 'string',
+          description: 'Term to look up (e.g., "protected health information", "personal data")',
+        },
+        regulation: {
+          type: 'string',
+          description: 'Optional: Filter to specific regulation (e.g., "HIPAA")',
+        },
+      },
+      required: ['term'],
+    },
+    handler: async (db, args) => getDefinitions(db, args as DefinitionsInput),
+  },
+  // Evidence requirements
+  {
+    name: 'get_evidence_requirements',
+    description: 'Get compliance evidence requirements for a specific section (e.g., audit logs, policies, procedures). MVP: Returns placeholder until evidence data is seeded.',
+    inputSchema: {
+      type: 'object',
+      properties: {
+        regulation: {
+          type: 'string',
+          description: 'Regulation ID (e.g., "HIPAA")',
+        },
+        section: {
+          type: 'string',
+          description: 'Section number (e.g., "164.312(b)")',
+        },
+      },
+      required: ['regulation', 'section'],
+    },
+    handler: async (db, args) => getEvidenceRequirements(db, args as EvidenceInput),
+  },
+  // Action-item generation
+  {
+    name: 'get_compliance_action_items',
+    description: 'Generate structured compliance action items from regulation sections. Extracts priority (high/medium/low) based on regulatory language and identifies evidence needed.',
+    inputSchema: {
+      type: 'object',
+      properties: {
+        regulation: {
+          type: 'string',
+          description: 'Regulation ID (e.g., "HIPAA", "CCPA")',
+        },
+        sections: {
+          type: 'array',
+          items: { type: 'string' },
+          description: 'Section numbers to generate action items for (e.g., ["164.308(a)(1)(ii)(A)", "164.312(b)"])',
+        },
+      },
+      required: ['regulation', 'sections'],
+    },
+    handler: async (db, args) => getComplianceActionItems(db, args as ActionItemsInput),
+  },
+];
+/**
+ * Register all tools with an MCP server instance.
+ * Use this for both stdio and HTTP servers to ensure parity.
+ *
+ * Installs two request handlers:
+ * - tool listing: returns name, description and input schema of every TOOLS entry;
+ * - tool call: looks the tool up by name and runs its handler.
+ *
+ * Tool failures are not thrown to the transport. An unknown tool name or a
+ * handler error is returned as a text result flagged with `isError: true`.
+ *
+ * @param server - MCP server the handlers are attached to.
+ * @param db - Database handle passed to every tool handler.
+ */
+export function registerTools(server: Server, db: Database.Database): void {
+  // List available tools
+  server.setRequestHandler(ListToolsRequestSchema, async () => ({
+    tools: TOOLS.map(tool => ({
+      name: tool.name,
+      description: tool.description,
+      inputSchema: tool.inputSchema,
+    })),
+  }));
+  // Handle tool calls
+  server.setRequestHandler(CallToolRequestSchema, async (request) => {
+    const { name, arguments: args } = request.params;
+    const tool = TOOLS.find(t => t.name === name);
+    if (!tool) {
+      return {
+        content: [{ type: 'text', text: `Unknown tool: ${name}` }],
+        isError: true,
+      };
+    }
+    try {
+      const result = await tool.handler(db, args || {});
+      // JSON.stringify(undefined) returns undefined, which would leave `text`
+      // without a string value; serialize a missing result as JSON null instead.
+      const text = typeof result === 'string' ? result : JSON.stringify(result ?? null, null, 2);
+      return {
+        content: [{ type: 'text', text }],
+      };
+    } catch (error) {
+      // Keep the message of thrown strings as well as Error instances; anything
+      // else has no reliable textual form and is reported generically.
+      let message = 'Unknown error';
+      if (error instanceof Error) {
+        message = error.message;
+      } else if (typeof error === 'string') {
+        message = error;
+      }
+      return {
+        content: [{ type: 'text', text: `Error: ${message}` }],
+        isError: true,
+      };
+    }
+  });
+}

package/src/tools/search.ts ADDED Viewed

@@ -0,0 +1,132 @@
+import type { Database } from 'better-sqlite3';
+/** Arguments accepted by searchRegulations. */
+export interface SearchInput {
+  /** Free-text search query; an empty or whitespace-only value is rejected with an error. */
+  query: string;
+  /** Optional regulation IDs; when non-empty, results are restricted to these regulations. */
+  regulations?: string[];
+  /** Maximum number of rows to return. Defaults to 10; non-finite or negative values fall back to 10; capped at 1000. */
+  limit?: number;
+}
+/** One full-text search hit returned by searchRegulations. */
+export interface SearchResult {
+  /** Value of the `regulation` column of the matching index row. */
+  regulation: string;
+  /** Value of the `section_number` column of the matching index row. */
+  section: string;
+  /** Value of the `title` column of the matching index row. */
+  title: string;
+  /** Excerpt produced by the FTS5 snippet() function, with matches wrapped in `>>>` / `<<<` and `...` marking elided text. */
+  snippet: string;
+  /** Absolute value of the FTS5 bm25() score for the row. */
+  relevance: number;
+}
+/**
+ * Convert free-form user text into a syntactically safe FTS5 MATCH expression.
+ *
+ * Processing steps:
+ * 1. Quote characters are removed ("patient's" → "patients").
+ * 2. Every other ASCII character that is not a letter or digit (hyphens, dots,
+ *    parentheses, colons, asterisks, ...) is treated as a word separator, so
+ *    "third-party" → "third party" and "164.312(b)" → "164 312 b". Left in
+ *    place, these characters are FTS5 syntax and make the query fail to parse.
+ * 3. Stopwords and words of two characters or fewer are discarded.
+ * 4. Each remaining word is emitted as a quoted prefix term (`"word"*`).
+ *    Quoting keeps a word such as NOT from being parsed as an FTS5 operator;
+ *    the trailing `*` matches word variations (encrypt vs encryption).
+ * 5. Terms are combined adaptively:
+ *    - 1-2 words: implicit AND, for precision
+ *    - 3+ words: OR, for recall (BM25 still ranks rows with more matches higher)
+ *
+ * @param query - Raw search text supplied by the caller.
+ * @returns The FTS5 expression, or an empty string when no searchable word remains.
+ */
+function escapeFts5Query(query: string): string {
+  // Common stopwords that add noise to searches
+  const stopwords = new Set(['a', 'an', 'the', 'and', 'or', 'but', 'in', 'on', 'at', 'to', 'for', 'of', 'with', 'by']);
+  const words = query
+    .replace(/['"]/g, '') // Remove quotes so each term can be safely re-quoted below
+    // ASCII punctuation/symbols become separators; non-ASCII characters are kept as-is
+    .replace(/[^A-Za-z0-9\u0080-\uFFFF]+/g, ' ')
+    .split(/\s+/)
+    .filter(word => word.length > 2 && !stopwords.has(word.toLowerCase())); // Filter short words and stopwords
+  if (words.length === 0) {
+    return '';
+  }
+  // Example: incident reporting → "incident"* "reporting"*
+  const terms = words.map(word => `"${word}"*`);
+  // Example: encryption transmission storage → "encryption"* OR "transmission"* OR "storage"*
+  return terms.join(words.length <= 2 ? ' ' : ' OR ');
+}
+/**
+ * Run a full-text search against the `sections_fts` index.
+ *
+ * @param db - Database handle used to prepare and run the query.
+ * @param input - Query text, optional regulation filter and optional row limit.
+ * @returns Matching rows ordered by bm25() score, with `relevance` made non-negative.
+ *          Returns an empty array when the query has no searchable terms or when
+ *          the database reports an error whose message mentions "fts5".
+ * @throws Error when `query` is empty or whitespace-only; any other database error is rethrown.
+ */
+export async function searchRegulations(
+  db: Database,
+  input: SearchInput
+): Promise<SearchResult[]> {
+  const { query, regulations } = input;
+  const requestedLimit = input.limit === undefined ? 10 : input.limit;
+  // Fall back to the default for anything that is not a finite, non-negative number,
+  // then round down and cap at 1000.
+  const usableLimit = Number.isFinite(requestedLimit) && requestedLimit >= 0 ? requestedLimit : 10;
+  const rowCap = Math.min(Math.floor(usableLimit), 1000);
+  if (!query || query.trim().length === 0) {
+    throw new Error('Query cannot be empty. Please provide a search term.');
+  }
+  const matchExpression = escapeFts5Query(query);
+  if (!matchExpression) {
+    return [];
+  }
+  // Bound values, in placeholder order: MATCH expression, regulation IDs, LIMIT.
+  const bindings: (string | number)[] = [matchExpression];
+  let regulationFilter = '';
+  if (regulations && regulations.length > 0) {
+    regulationFilter = ` AND regulation IN (${regulations.map(() => '?').join(', ')})`;
+    bindings.push(...regulations);
+  }
+  bindings.push(rowCap);
+  const sectionsQuery = `
+    SELECT
+      sections_fts.regulation,
+      sections_fts.section_number as section,
+      sections_fts.title,
+      snippet(sections_fts, 3, '>>>', '<<<', '...', 32) as snippet,
+      bm25(sections_fts) as relevance
+    FROM sections_fts
+    WHERE sections_fts MATCH ?
+    ${regulationFilter}
+    ORDER BY bm25(sections_fts)
+    LIMIT ?
+  `;
+  try {
+    const hits = db.prepare(sectionsQuery).all(...bindings) as SearchResult[];
+    // bm25() yields negative scores; expose them as positive numbers
+    return hits.map(hit => ({ ...hit, relevance: Math.abs(hit.relevance) }));
+  } catch (error) {
+    // Only FTS5 failures (e.g. syntax errors) are converted to "no results"
+    if (!(error instanceof Error) || !error.message.includes('fts5')) {
+      throw error;
+    }
+    return [];
+  }
+}

package/src/tools/section.ts ADDED Viewed

@@ -0,0 +1,85 @@
+import type { Database } from 'better-sqlite3';
+/** Arguments accepted by getSection. */
+export interface GetSectionInput {
+  /** Regulation ID; compared for equality with the `regulation` column. */
+  regulation: string;
+  /** Section number; compared for equality with the `section_number` column. */
+  section: string;
+}
+/** A regulation section as returned by getSection. */
+export interface SectionData {
+  /** Value of the `regulation` column. */
+  regulation: string;
+  /** Value of the `section_number` column. */
+  section_number: string;
+  /** Value of the `title` column. */
+  title: string | null;
+  /** Section text; cut to 50,000 characters plus a trailing notice when `truncated` is true. */
+  text: string;
+  /** Value of the `chapter` column. */
+  chapter: string | null;
+  /** Value of the `parent_section` column. */
+  parent_section: string | null;
+  /** Parsed from the JSON stored in the `cross_references` column; null when the column is empty or holds invalid JSON. */
+  cross_references: string[] | null;
+  /** True when the stored text exceeded the length limit and was shortened. */
+  truncated?: boolean;
+  /** Character count of the stored text; only set when `truncated` is true. */
+  original_length?: number;
+  /** Stored text length divided by 4, rounded up; only set when `truncated` is true. */
+  token_estimate?: number;
+}
+/**
+ * Load one section of a regulation by regulation ID and section number.
+ *
+ * Text longer than 50,000 characters is cut at that length and followed by a
+ * notice stating the original size; `truncated`, `original_length` and
+ * `token_estimate` describe the cut. The `cross_references` column is parsed
+ * as JSON; unparsable content is logged with console.warn and returned as null.
+ *
+ * @param db - Database handle used to run the lookup.
+ * @param input - Regulation ID and section number to look up.
+ * @returns The section, or null when no matching row exists.
+ */
+export async function getSection(
+  db: Database,
+  input: GetSectionInput
+): Promise<SectionData | null> {
+  const sql = `
+    SELECT
+      regulation,
+      section_number,
+      title,
+      text,
+      chapter,
+      parent_section,
+      cross_references
+    FROM sections
+    WHERE regulation = ? AND section_number = ?
+  `;
+  const record = db.prepare(sql).get(input.regulation, input.section) as {
+    regulation: string;
+    section_number: string;
+    title: string | null;
+    text: string;
+    chapter: string | null;
+    parent_section: string | null;
+    cross_references: string | null;
+  } | undefined;
+  if (!record) {
+    return null;
+  }
+  // Token management: cap very large sections so a single response cannot overflow the context
+  const MAX_CHARS = 50000; // ~12,500 tokens at ~4 chars per token
+  const fullLength = record.text.length;
+  const approxTokens = Math.ceil(fullLength / 4);
+  const truncated = fullLength > MAX_CHARS;
+  const text = truncated
+    ? `${record.text.substring(0, MAX_CHARS)}\n\n[... Section truncated due to length. Original: ${fullLength} chars (~${approxTokens} tokens). Use search_regulations to find specific content.]`
+    : record.text;
+  // Stays null when the column is empty or its JSON cannot be parsed
+  let crossReferences: string[] | null = null;
+  if (record.cross_references) {
+    try {
+      crossReferences = JSON.parse(record.cross_references);
+    } catch {
+      console.warn(`Invalid cross_references JSON for ${record.regulation} ${record.section_number}`);
+    }
+  }
+  return {
+    regulation: record.regulation,
+    section_number: record.section_number,
+    title: record.title,
+    text,
+    chapter: record.chapter,
+    parent_section: record.parent_section,
+    cross_references: crossReferences,
+    truncated,
+    original_length: truncated ? fullLength : undefined,
+    token_estimate: truncated ? approxTokens : undefined,
+  };
+}