npm - @kiyeonjeon21/datacontext - Versions diffs - 0.2.0 → 0.3.0 - Mend

@kiyeonjeon21/datacontext 0.2.0 → 0.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (51) hide show

package/.cursorrules +12 -0
package/.env.example +8 -0
package/.github/workflows/ci.yml +21 -1
package/.github/workflows/publish.yml +21 -1
package/CHANGELOG.md +41 -0
package/README.md +247 -239
package/datacontext.db +0 -0
package/dist/api/server.d.ts.map +1 -1
package/dist/api/server.js +145 -0
package/dist/api/server.js.map +1 -1
package/dist/api/start-server.d.ts +10 -0
package/dist/api/start-server.d.ts.map +1 -0
package/dist/api/start-server.js +73 -0
package/dist/api/start-server.js.map +1 -0
package/dist/cli/index.js +462 -0
package/dist/cli/index.js.map +1 -1
package/dist/core/context-service.d.ts +58 -0
package/dist/core/context-service.d.ts.map +1 -1
package/dist/core/context-service.js +121 -0
package/dist/core/context-service.js.map +1 -1
package/dist/core/index.d.ts +2 -0
package/dist/core/index.d.ts.map +1 -1
package/dist/core/index.js +5 -1
package/dist/core/index.js.map +1 -1
package/dist/core/llm-service.d.ts +141 -0
package/dist/core/llm-service.d.ts.map +1 -0
package/dist/core/llm-service.js +284 -0
package/dist/core/llm-service.js.map +1 -0
package/dist/knowledge/store.d.ts +56 -3
package/dist/knowledge/store.d.ts.map +1 -1
package/dist/knowledge/store.js +193 -7
package/dist/knowledge/store.js.map +1 -1
package/dist/knowledge/types.d.ts +43 -1
package/dist/knowledge/types.d.ts.map +1 -1
package/dist/knowledge/types.js.map +1 -1
package/dist/mcp/tools.d.ts.map +1 -1
package/dist/mcp/tools.js +365 -0
package/dist/mcp/tools.js.map +1 -1
package/docs/API.md +173 -0
package/docs/DEMO_SCRIPT.md +210 -0
package/docs/SYNC_GUIDE.md +242 -0
package/package.json +4 -1
package/src/api/server.ts +160 -0
package/src/api/start-server.ts +78 -0
package/src/cli/index.ts +534 -0
package/src/core/context-service.ts +157 -0
package/src/core/index.ts +7 -0
package/src/core/llm-service.ts +359 -0
package/src/knowledge/store.ts +232 -7
package/src/knowledge/types.ts +45 -1
package/src/mcp/tools.ts +415 -0

package/src/mcp/tools.ts CHANGED Viewed

@@ -263,6 +263,98 @@ export function getMcpTools(): Tool[] {
         required: ['name', 'description', 'tables'],
       },
     },
+    // === Glossary Tools ===
+    {
+      name: 'generate_glossary',
+      description: 'Generate business glossary/terms from user input using AI. Takes natural language term definitions and creates structured SQL-ready glossary entries. Requires ANTHROPIC_API_KEY to be set.',
+      inputSchema: {
+        type: 'object',
+        properties: {
+          terms: {
+            type: 'string',
+            description: 'Raw term definitions in natural language. Can be comma-separated, one per line, or structured (YAML-like). Example: "활성 사용자 = status가 1인 사용자\\n최근 주문 = 30일 이내 주문\\nVIP = 주문 10건 이상"',
+          },
+        },
+        required: ['terms'],
+      },
+    },
+    {
+      name: 'add_term',
+      description: 'Add a single business term to the glossary manually.',
+      inputSchema: {
+        type: 'object',
+        properties: {
+          term: {
+            type: 'string',
+            description: 'The business term (e.g., "활성 사용자", "active user").',
+          },
+          definition: {
+            type: 'string',
+            description: 'Human-readable definition of the term.',
+          },
+          sql: {
+            type: 'string',
+            description: 'SQL expression for this term (e.g., "status = 1").',
+          },
+          synonyms: {
+            type: 'array',
+            items: { type: 'string' },
+            description: 'Alternative names for this term.',
+          },
+          tables: {
+            type: 'array',
+            items: { type: 'string' },
+            description: 'Tables this term applies to.',
+          },
+        },
+        required: ['term', 'definition'],
+      },
+    },
+    {
+      name: 'list_terms',
+      description: 'List all business terms in the glossary.',
+      inputSchema: {
+        type: 'object',
+        properties: {
+          category: {
+            type: 'string',
+            description: 'Filter by category (status, time, money, entity, metric, filter, custom).',
+          },
+          table: {
+            type: 'string',
+            description: 'Filter by table name.',
+          },
+        },
+      },
+    },
+    {
+      name: 'search_terms',
+      description: 'Search for business terms that match a query. Useful for finding relevant terms before generating SQL.',
+      inputSchema: {
+        type: 'object',
+        properties: {
+          query: {
+            type: 'string',
+            description: 'Search query to match against term names and synonyms.',
+          },
+        },
+        required: ['query'],
+      },
+    },
+    {
+      name: 'enhance_query',
+      description: 'Enhance a natural language query by matching it against the business glossary. Returns suggested SQL conditions based on matched terms. Requires ANTHROPIC_API_KEY.',
+      inputSchema: {
+        type: 'object',
+        properties: {
+          query: {
+            type: 'string',
+            description: 'Natural language query to enhance (e.g., "활성 사용자 중 최근 주문한 VIP 고객")',
+          },
+        },
+        required: ['query'],
+      },
+    },
   ];
 }
@@ -298,6 +390,17 @@ export async function handleToolCall(
       return handleAddQueryExample(args, context);
     case 'add_business_rule':
       return handleAddBusinessRule(args, context);
+    // === Glossary Tools ===
+    case 'generate_glossary':
+      return handleGenerateGlossary(args, context);
+    case 'add_term':
+      return handleAddTerm(args, context);
+    case 'list_terms':
+      return handleListTerms(args, context);
+    case 'search_terms':
+      return handleSearchTerms(args, context);
+    case 'enhance_query':
+      return handleEnhanceQuery(args, context);
     default:
       throw new Error(`Unknown tool: ${name}`);
   }
@@ -820,6 +923,318 @@ async function handleAddBusinessRule(
   };
 }
+// ============================================================
+// Glossary Tool Handlers
+// ============================================================
+/**
+ * Handle generate_glossary tool - AI-powered glossary generation.
+ *
+ * Passes the caller's raw term definitions to the LLM service along with a
+ * schema summary (at most the first 20 tables returned by the adapter) and
+ * the result of `knowledge.getBusinessTerms()`, then stores whatever the LLM
+ * produced through `knowledge.addBusinessTerms()`.
+ *
+ * @param args - Tool arguments; `terms` carries the raw term definitions.
+ * @param context - Tool context providing `adapter` and `knowledge`.
+ * @returns `{ success: true, ... }` describing the stored terms, or
+ *   `{ success: false, error, tip }` when the LLM is not available or any
+ *   step of the generation attempt throws.
+ * @throws Error if `terms` is missing or empty.
+ */
+async function handleGenerateGlossary(
+  args: Record<string, unknown>,
+  context: ToolContext
+): Promise<unknown> {
+  const rawDefinitions = args.terms as string;
+  if (!rawDefinitions) {
+    throw new Error('terms is required');
+  }
+  // The LLM module is imported on demand, inside the handler.
+  const { isLLMAvailable, createLLMService } = await import('../core/llm-service.js');
+  const llmReady = isLLMAvailable();
+  if (!llmReady) {
+    return {
+      success: false,
+      error: 'ANTHROPIC_API_KEY not configured. Set the environment variable to use AI-powered glossary generation.',
+      tip: 'You can still add terms manually using the add_term tool.',
+    };
+  }
+  try {
+    // Summarise the schema for the prompt; only the first 20 tables are sent.
+    const schema = await context.adapter.getSchema();
+    const tableSummaries = schema.tables.slice(0, 20).map(tbl => {
+      const columns = tbl.columns.map(col => ({
+        name: col.name,
+        type: col.dataType,
+        nullable: col.isNullable,
+      }));
+      return { name: tbl.name, columns };
+    });
+    const promptContext = {
+      tables: tableSummaries,
+      existingTerms: context.knowledge.getBusinessTerms(),
+    };
+    const service = createLLMService();
+    const produced = await service.generateGlossary(
+      rawDefinitions,
+      promptContext,
+      context.knowledge.getSchemaHash()
+    );
+    // Persist the generated terms and report what was stored.
+    const stored = await context.knowledge.addBusinessTerms(produced);
+    const summary = stored.map(entry => ({
+      term: entry.term,
+      definition: entry.definition,
+      sql: entry.sqlExpression,
+      category: entry.category,
+      tables: entry.appliesTo?.tables,
+    }));
+    return {
+      success: true,
+      generated: stored.length,
+      terms: summary,
+      message: `Generated and added ${stored.length} business term(s) to glossary.`,
+      tip: 'These terms will now be used to enhance query understanding.',
+    };
+  } catch (error) {
+    // Failures are reported in the result object rather than rethrown.
+    const reason = error instanceof Error ? error.message : String(error);
+    return {
+      success: false,
+      error: reason,
+      tip: 'Check your API key and try again with simpler term definitions.',
+    };
+  }
+}
+/**
+ * Handle add_term tool - manual term addition.
+ *
+ * Stores a single business term via `knowledge.addBusinessTerm()` and echoes
+ * the stored entry back to the caller.
+ *
+ * @param args - Tool arguments: `term` and `definition` are required;
+ *   `sql`, `synonyms` and `tables` are optional.
+ * @param context - Tool context providing `knowledge`.
+ * @returns A success object built from the stored entry.
+ * @throws Error if `term` or `definition` is missing or empty.
+ */
+async function handleAddTerm(
+  args: Record<string, unknown>,
+  context: ToolContext
+): Promise<unknown> {
+  const termName = args.term as string;
+  if (!termName) throw new Error('term is required');
+  const termDefinition = args.definition as string;
+  if (!termDefinition) throw new Error('definition is required');
+  const tableNames = args.tables as string[] | undefined;
+  // `appliesTo` is only populated when the caller supplied tables.
+  const scope = tableNames ? { tables: tableNames } : undefined;
+  const stored = await context.knowledge.addBusinessTerm(termName, termDefinition, {
+    sqlExpression: args.sql as string | undefined,
+    synonyms: args.synonyms as string[] | undefined,
+    appliesTo: scope,
+  });
+  return {
+    success: true,
+    term: stored.term,
+    definition: stored.definition,
+    sql: stored.sqlExpression,
+    synonyms: stored.synonyms,
+    tables: stored.appliesTo?.tables,
+    // The message quotes the term as supplied by the caller.
+    message: `Added term "${termName}" to glossary.`,
+    tip: 'This term will be used in query context when relevant.',
+  };
+}
+/**
+ * Handle list_terms tool.
+ *
+ * Lists the terms returned by `knowledge.getActiveTerms()`, optionally
+ * narrowed by category and/or by a table named in `appliesTo.tables`.
+ *
+ * @param args - Tool arguments; optional `category` and `table` filters.
+ * @param context - Tool context providing `knowledge`.
+ * @returns `{ count, terms, categories }` for a non-empty result, or
+ *   `{ count: 0, terms: [], message, tip }` when nothing matches.
+ */
+async function handleListTerms(
+  args: Record<string, unknown>,
+  context: ToolContext
+): Promise<unknown> {
+  const categoryFilter = args.category as string | undefined;
+  const tableFilter = args.table as string | undefined;
+  // A filter is applied only when its argument is non-empty.
+  const selected = context.knowledge.getActiveTerms().filter(entry => {
+    if (categoryFilter && entry.category !== categoryFilter) {
+      return false;
+    }
+    if (tableFilter && !entry.appliesTo?.tables?.includes(tableFilter)) {
+      return false;
+    }
+    return true;
+  });
+  if (selected.length === 0) {
+    return {
+      count: 0,
+      terms: [],
+      message: 'No business terms found.',
+      tip: 'Add terms using add_term or generate_glossary.',
+    };
+  }
+  const listing = selected.map(entry => ({
+    id: entry.id,
+    term: entry.term,
+    synonyms: entry.synonyms,
+    definition: entry.definition,
+    sql: entry.sqlExpression,
+    category: entry.category,
+    tables: entry.appliesTo?.tables,
+    isActive: entry.isActive,
+  }));
+  // Distinct, truthy categories in first-seen order.
+  const distinctCategories = Array.from(
+    new Set(selected.map(entry => entry.category).filter(Boolean))
+  );
+  return {
+    count: selected.length,
+    terms: listing,
+    categories: distinctCategories,
+  };
+}
+/**
+ * Handle search_terms tool.
+ *
+ * Looks up glossary terms with `knowledge.findMatchingTerms()` and returns
+ * them with a relevance score plus the SQL expressions of the matches that
+ * have one.
+ *
+ * @param args - Tool arguments; `query` is the search text.
+ * @param context - Tool context providing `knowledge`.
+ * @returns `{ query, count, terms, suggestedConditions, message }` when
+ *   there are matches, otherwise `{ count: 0, terms: [], message, tip }`.
+ * @throws Error if `query` is missing or empty.
+ */
+async function handleSearchTerms(
+  args: Record<string, unknown>,
+  context: ToolContext
+): Promise<unknown> {
+  const query = args.query as string;
+  if (!query) {
+    throw new Error('query is required');
+  }
+  const hits = context.knowledge.findMatchingTerms(query);
+  const hitCount = hits.length;
+  if (hitCount === 0) {
+    return {
+      count: 0,
+      terms: [],
+      message: `No terms found matching "${query}".`,
+      tip: 'Try a broader search or check available terms with list_terms.',
+    };
+  }
+  const scoredTerms = hits.map(hit => ({
+    term: hit.term,
+    synonyms: hit.synonyms,
+    definition: hit.definition,
+    sql: hit.sqlExpression,
+    category: hit.category,
+    relevance: calculateTermRelevance(query, hit),
+  }));
+  // Only matches that carry a SQL expression contribute a condition.
+  const suggestedConditions: string[] = [];
+  for (const hit of hits) {
+    if (hit.sqlExpression) {
+      suggestedConditions.push(hit.sqlExpression as string);
+    }
+  }
+  return {
+    query,
+    count: hitCount,
+    terms: scoredTerms,
+    suggestedConditions,
+    message: `Found ${hitCount} term(s) matching "${query}".`,
+  };
+}
+/**
+ * Handle enhance_query tool - AI-powered query enhancement.
+ *
+ * Resolution order:
+ *   1. Local matching via `knowledge.findMatchingTerms()`; any hit is
+ *      returned immediately with `method: 'local'`.
+ *   2. If there is no local hit and the LLM is not available, or the
+ *      glossary has no active terms, the query is returned unchanged with an
+ *      explanatory message.
+ *   3. Otherwise the LLM service is asked to enhance the query
+ *      (`method: 'ai'`).
+ *
+ * @param args - Tool arguments; `query` is the natural language query.
+ * @param context - Tool context providing `knowledge`.
+ * @returns A result object; `success: false` with `error` and `tip` only
+ *   when the LLM-backed path throws.
+ * @throws Error if `query` is missing or empty.
+ */
+async function handleEnhanceQuery(
+  args: Record<string, unknown>,
+  context: ToolContext
+): Promise<unknown> {
+  const query = args.query as string;
+  if (!query) {
+    throw new Error('query is required');
+  }
+  // Shared shape for the "nothing matched, query returned as-is" responses.
+  const unchanged = (message: string) => ({
+    success: true,
+    method: 'local',
+    query,
+    enhancedQuery: query,
+    usedTerms: [],
+    suggestedConditions: [],
+    message,
+  });
+  // First try local matching (no LLM)
+  const glossaryHits = context.knowledge.findMatchingTerms(query);
+  if (glossaryHits.length > 0) {
+    const suggestedConditions: string[] = [];
+    for (const hit of glossaryHits) {
+      if (hit.sqlExpression) {
+        suggestedConditions.push(hit.sqlExpression as string);
+      }
+    }
+    return {
+      success: true,
+      method: 'local',
+      query,
+      enhancedQuery: query,
+      usedTerms: glossaryHits.map(hit => hit.term),
+      suggestedConditions,
+      terms: glossaryHits.map(hit => ({
+        term: hit.term,
+        sql: hit.sqlExpression,
+        category: hit.category,
+      })),
+      tip: 'Use these SQL conditions in your WHERE clause.',
+    };
+  }
+  // Try LLM enhancement if available
+  const { isLLMAvailable, createLLMService } = await import('../core/llm-service.js');
+  if (!isLLMAvailable()) {
+    return unchanged(
+      'No matching terms found locally. Configure ANTHROPIC_API_KEY for AI-powered enhancement.'
+    );
+  }
+  try {
+    const activeTerms = context.knowledge.getActiveTerms();
+    if (activeTerms.length === 0) {
+      return unchanged('No terms in glossary. Add terms using add_term or generate_glossary.');
+    }
+    const service = createLLMService();
+    const enhanced = await service.enhanceQueryWithGlossary(query, activeTerms);
+    let message: string;
+    if (enhanced.usedTerms.length > 0) {
+      message = `Found ${enhanced.usedTerms.length} matching term(s): ${enhanced.usedTerms.join(', ')}`;
+    } else {
+      message = 'No matching terms found.';
+    }
+    return {
+      success: true,
+      method: 'ai',
+      query,
+      enhancedQuery: enhanced.enhancedQuery,
+      usedTerms: enhanced.usedTerms,
+      suggestedConditions: enhanced.suggestedConditions,
+      message,
+      tip: 'Apply suggestedConditions to your SQL WHERE clause.',
+    };
+  } catch (error) {
+    // Failures on the LLM path are reported in the result, not rethrown.
+    const reason = error instanceof Error ? error.message : String(error);
+    return {
+      success: false,
+      error: reason,
+      tip: 'Fallback to local term matching.',
+    };
+  }
+}
+/**
+ * Calculate term relevance score.
+ *
+ * Comparison is case-insensitive. The highest applicable score wins:
+ *   1.0 - term equals the query
+ *   0.9 - a synonym equals the query
+ *   0.8 - term contains the query
+ *   0.7 - query contains the term
+ *   0.6 - a synonym contains the query
+ *   0.5 - none of the above
+ *
+ * Every synonym is examined before a score is settled, so an exact synonym
+ * match is not hidden by a partial term match or by an earlier synonym that
+ * only partially matches.
+ *
+ * @param query - Search text entered by the caller.
+ * @param term - Glossary entry; only `term` and `synonyms` are read.
+ * @returns A score between 0.5 and 1.0.
+ */
+function calculateTermRelevance(query: string, term: { term: string; synonyms: string[] }): number {
+  const lowerQuery = query.toLowerCase();
+  const lowerTerm = term.term.toLowerCase();
+  // Exact match = 1.0 (nothing can outrank it)
+  if (lowerTerm === lowerQuery) return 1.0;
+  let best = 0.5;
+  if (lowerTerm.includes(lowerQuery)) {
+    // Term contains query = 0.8
+    best = 0.8;
+  } else if (lowerQuery.includes(lowerTerm)) {
+    // Query contains term = 0.7
+    best = 0.7;
+  }
+  // NOTE(review): `synonyms` is typed as required, but stored terms may have
+  // been created without it - treated as empty here; confirm against the store.
+  for (const syn of term.synonyms ?? []) {
+    const lowerSyn = syn.toLowerCase();
+    // Exact synonym match = 0.9, which beats every remaining candidate.
+    if (lowerSyn === lowerQuery) return 0.9;
+    // Partial synonym match = 0.6; keep scanning for an exact one.
+    if (lowerSyn.includes(lowerQuery)) best = Math.max(best, 0.6);
+  }
+  return best;
+}
 // ============================================================
 // Utility Functions
 // ============================================================