npm - @malloydata/db-snowflake - Versions diffs - 0.0.375 → 0.0.377 - Mend

@malloydata/db-snowflake 0.0.375 → 0.0.377

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (33) hide show

package/dist/index.js +29 -2
package/dist/index.js.map +1 -1
package/dist/snowflake_connection.d.ts +48 -13
package/dist/snowflake_connection.js +144 -228
package/dist/snowflake_connection.js.map +1 -1
package/dist/snowflake_connection.spec.js +179 -14
package/dist/snowflake_connection.spec.js.map +1 -1
package/dist/snowflake_sample_strategy.spec.js +97 -0
package/dist/snowflake_sample_strategy.spec.js.map +1 -0
package/dist/snowflake_table_name.d.ts +19 -0
package/dist/snowflake_table_name.js +80 -0
package/dist/snowflake_table_name.js.map +1 -0
package/dist/snowflake_variant_schema.d.ts +43 -0
package/dist/snowflake_variant_schema.js +203 -0
package/dist/snowflake_variant_schema.js.map +1 -0
package/dist/snowflake_variant_schema.spec.js +150 -0
package/dist/snowflake_variant_schema.spec.js.map +1 -0
package/package.json +2 -2
package/src/index.ts +34 -1
package/src/snowflake_connection.spec.ts +219 -15
package/src/snowflake_connection.ts +218 -262
package/src/snowflake_sample_strategy.spec.ts +130 -0
package/src/snowflake_table_name.ts +94 -0
package/src/snowflake_variant_schema.spec.ts +188 -0
package/src/snowflake_variant_schema.ts +301 -0
package/dist/snowflake_executor.spec.js +0 -89
package/dist/snowflake_executor.spec.js.map +0 -1
package/dist/snowflake_setup.spec.js +0 -76
package/dist/snowflake_setup.spec.js.map +0 -1
package/src/snowflake_executor.spec.ts +0 -103
package/src/snowflake_setup.spec.ts +0 -56
/package/dist/{snowflake_executor.spec.d.ts → snowflake_sample_strategy.spec.d.ts} +0 -0
/package/dist/{snowflake_setup.spec.d.ts → snowflake_variant_schema.spec.d.ts} +0 -0

package/src/snowflake_connection.ts CHANGED Viewed

@@ -34,27 +34,69 @@ import type {
   StructDef,
   QueryRecord,
   TestableConnection,
-  Dialect,
-  RecordDef,
-  AtomicFieldDef,
-  ArrayDef,
   SQLSourceRequest,
 } from '@malloydata/malloy';
-import {
-  SnowflakeDialect,
-  TinyParser,
-  mkArrayDef,
-  sqlKey,
-  makeDigest,
-} from '@malloydata/malloy';
+import {SnowflakeDialect, sqlKey, makeDigest} from '@malloydata/malloy';
 import {BaseConnection} from '@malloydata/malloy/connection';
 import {SnowflakeExecutor} from './snowflake_executor';
+import {
+  accumulateVariantPath,
+  buildTopLevelField,
+  createVariantSchemaState,
+  PathParser,
+  seedTopLevelShape,
+} from './snowflake_variant_schema';
+import type {NestedColumn} from './snowflake_variant_schema';
+import {parseSnowflakeTableName} from './snowflake_table_name';
 import type {ConnectionOptions} from 'snowflake-sdk';
 import type {Options as PoolOptions} from 'generic-pool';
 type namespace = {database: string; schema: string};
+/**
+ * Output of the INFORMATION_SCHEMA.TABLES probe. Undefined when the
+ * probe didn't run (non-parseable name, or a name with no schema part)
+ * or couldn't find numeric size info (views, missing permissions, a
+ * failed probe query, or no matching catalog row).
+ */
+export interface TableSizeProbe {
+  bytes: number; // BYTES value from the catalog row, coerced with Number()
+  rowCount: number; // ROW_COUNT value from the catalog row, coerced with Number()
+}
+/**
+ * Three-way tier that drives variant schema sampling. Extracted as a
+ * pure function so cost-policy decisions are unit-testable.
+ *
+ *   full-scan-then-sample: probe confirmed a small base table. One
+ *     full scan catches rare fields. On failure, fall through to the
+ *     sample chain rather than accept opaque variant.
+ *
+ *   tablesample-only: probe confirmed a base table above the small
+ *     threshold. TABLESAMPLE BLOCK is safe (reads a few micro
+ *     partitions). Plain LIMIT without a WHERE is unsafe on large
+ *     partitioned tables, so we skip the LIMIT fallback — we'd rather
+ *     degrade to variant than issue a runaway query.
+ *
+ *   tablesample-then-limit: probe gave no size info (views, temp
+ *     views, exotic names). We can't distinguish a small view from a
+ *     view over a petabyte table, so we do best-effort sampling. This
+ *     is the acknowledged "can't help you" case from the design doc.
+ *
+ * pickSampleStrategy maps a probe result to one of these tiers:
+ *   - no probe result            → tablesample-then-limit
+ *   - probe.bytes at or below fullScanMaxBytes (inclusive)
+ *                                → full-scan-then-sample
+ *   - anything else              → tablesample-only
+ * Only probe.bytes is consulted; probe.rowCount does not influence the
+ * choice. The function has no side effects.
+ */
+export type SampleStrategy =
+  | 'full-scan-then-sample'
+  | 'tablesample-only'
+  | 'tablesample-then-limit';
+export function pickSampleStrategy(
+  probe: TableSizeProbe | undefined,
+  fullScanMaxBytes: number
+): SampleStrategy {
+  if (probe === undefined) return 'tablesample-then-limit'; // size unknown: best effort
+  if (probe.bytes <= fullScanMaxBytes) return 'full-scan-then-sample'; // inclusive boundary
+  return 'tablesample-only'; // known-large: never fall back to a bare LIMIT
+}
 export interface SnowflakeConnectionOptions {
   // snowflake sdk connection options
   connOptions?: ConnectionOptions;
@@ -74,155 +116,18 @@ export interface SnowflakeConnectionOptions {
   // Timeout for the variant schema sampling query (default 15 seconds)
   schemaSampleTimeoutMs?: number;
-  // SQL statements to run when a connection is acquired from the pool
-  setupSQL?: string;
-}
-type PathChain =
-  | {arrayRef: true; next?: PathChain}
-  | {name: string; next?: PathChain};
-class SnowField {
-  constructor(
-    readonly name: string,
-    readonly type: string,
-    readonly dialect: Dialect
-  ) {}
-  fieldDef(): AtomicFieldDef {
-    return {
-      ...this.dialect.sqlTypeToMalloyType(this.type),
-      name: this.name,
-    };
-  }
-  walk(_path: PathChain, _fieldType: string): void {
-    throw new Error(
-      'SNOWWFLAKE SCHEMA PARSE ERROR: Should not walk through fields'
-    );
-  }
-  static make(name: string, fieldType: string, d: Dialect) {
-    if (fieldType === 'array') {
-      return new SnowArray(name, d);
-    } else if (fieldType === 'object') {
-      return new SnowObject(name, d);
-    }
-    return new SnowField(name, fieldType, d);
-  }
-}
-class SnowObject extends SnowField {
-  fieldMap = new Map<string, SnowField>();
-  constructor(name: string, d: Dialect) {
-    super(name, 'object', d);
-  }
-  get fields(): AtomicFieldDef[] {
-    const fields: AtomicFieldDef[] = [];
-    for (const [_, fieldObj] of this.fieldMap) {
-      fields.push(fieldObj.fieldDef());
-    }
-    return fields;
-  }
-  fieldDef(): RecordDef {
-    const rec: RecordDef = {
-      type: 'record',
-      name: this.name,
-      fields: this.fields,
-      join: 'one',
-    };
-    return rec;
-  }
-  walk(path: PathChain, fieldType: string) {
-    if ('name' in path) {
-      const field = this.fieldMap.get(path.name);
-      if (path.next) {
-        if (field instanceof SnowObject || field instanceof SnowArray) {
-          field.walk(path.next, fieldType);
-          return;
-        }
-        // Field is missing or is a scalar leaf — the variant data has
-        // inconsistent structure across rows. Degrade to opaque variant.
-        this.fieldMap.set(
-          path.name,
-          new SnowField(path.name, 'variant', this.dialect)
-        );
-        return;
-      } else {
-        if (!field) {
-          this.fieldMap.set(
-            path.name,
-            SnowField.make(path.name, fieldType, this.dialect)
-          );
-          return;
-        }
-      }
-      return;
-    }
-    // Array reference in an object context — inconsistent structure.
-    // Ignore this path; the object keeps whatever fields it already has.
-  }
-}
-class SnowArray extends SnowField {
-  arrayOf = 'unknown';
-  objectChild?: SnowObject;
-  arrayChild?: SnowArray;
-  constructor(name: string, d: Dialect) {
-    super(name, 'array', d);
-  }
-  isArrayOf(type: string) {
-    if (this.arrayOf !== 'unknown') {
-      this.arrayOf = 'variant';
-      return;
-    }
-    this.arrayOf = type;
-    if (type === 'object') {
-      this.objectChild = new SnowObject('', this.dialect);
-    } else if (type === 'array') {
-      this.arrayChild = new SnowArray('', this.dialect);
-    }
-  }
+  // Row limit used inside the variant schema sample (default 1000). When the
+  // probe reports the table is small enough to full-scan, this limit is
+  // ignored.
+  schemaSampleRowLimit?: number;
-  fieldDef(): ArrayDef {
-    if (this.objectChild) {
-      const t = mkArrayDef(
-        {type: 'record', fields: this.objectChild.fields},
-        this.name
-      );
-      return t;
-    }
-    if (this.arrayChild) {
-      return mkArrayDef(this.arrayChild.fieldDef(), this.name);
-    }
-    return mkArrayDef(
-      this.dialect.sqlTypeToMalloyType(this.arrayOf),
-      this.name
-    );
-  }
+  // Byte threshold at or below which variant schema inference skips sampling and
+  // full-scans the table instead (default 100 MB). A full scan catches rare
+  // fields that a sample would miss.
+  schemaSampleFullScanMaxBytes?: number;
-  walk(path: PathChain, fieldType: string) {
-    if ('arrayRef' in path) {
-      if (path.next) {
-        const next = this.arrayChild || this.objectChild;
-        if (next) {
-          next.walk(path.next, fieldType);
-          return;
-        }
-        // Array elements were scalars but now we see deeper structure —
-        // inconsistent variant data. Degrade to variant array.
-        this.arrayOf = 'variant';
-        return;
-      } else {
-        this.isArrayOf(fieldType);
-        return;
-      }
-    }
-    // Name reference in an array context — inconsistent structure.
-    // Degrade to variant array.
-    this.arrayOf = 'variant';
-  }
+  // SQL statements to run when a connection is acquired from the pool
+  setupSQL?: string;
 }
 /**
@@ -248,6 +153,8 @@ export class SnowflakeConnection
   private queryOptions: RunSQLOptions;
   private timeoutMs: number;
   private schemaSampleTimeoutMs: number;
+  private schemaSampleRowLimit: number;
+  private schemaSampleFullScanMaxBytes: number;
   private setupSQL: string | undefined;
   constructor(
@@ -271,6 +178,9 @@ export class SnowflakeConnection
     this.queryOptions = options?.queryOptions ?? {};
     this.timeoutMs = options?.timeoutMs ?? TIMEOUT_MS;
     this.schemaSampleTimeoutMs = options?.schemaSampleTimeoutMs ?? 15_000;
+    this.schemaSampleRowLimit = options?.schemaSampleRowLimit ?? 1000;
+    this.schemaSampleFullScanMaxBytes =
+      options?.schemaSampleFullScanMaxBytes ?? 100_000_000;
   }
   get dialectName(): string {
@@ -366,7 +276,7 @@ export class SnowflakeConnection
   ): Promise<void> {
     const infoQuery = `DESCRIBE TABLE ${tablePath}`;
     const rows = await this.executor.batch(infoQuery);
-    const variants: string[] = [];
+    const nestedColumns: NestedColumn[] = [];
     const notVariant = new Map<string, boolean>();
     for (const row of rows) {
       // data types look like `VARCHAR(1234)` or `NUMBER(10,2)`
@@ -374,8 +284,12 @@ export class SnowflakeConnection
       const baseType = fullType.split('(')[0];
       const name = row['name'] as string;
-      if (['variant', 'array', 'object'].includes(baseType)) {
-        variants.push(name);
+      if (
+        baseType === 'variant' ||
+        baseType === 'array' ||
+        baseType === 'object'
+      ) {
+        nestedColumns.push({kind: baseType, name});
       } else {
         notVariant.set(name, true);
         // For NUMBER types, pass full string so dialect can inspect scale
@@ -390,74 +304,167 @@ export class SnowflakeConnection
       }
     }
     // VARIANT, ARRAY, and OBJECT columns don't have schema in metadata —
-    // we have to sample actual data and inspect it to discover the structure.
-    // This is inherently heuristic (we only look at 100 rows) and can be
-    // slow on large partitioned tables or expensive views.
-    if (variants.length > 0) {
-      const variantArgs = variants.map(v => `'${v}', "${v}"`).join(', ');
-      // Build the analysis query that flattens sampled rows and detects
-      // the type of each leaf path. We only construct from variant columns
-      // (not *) to avoid flattening the entire row on wide tables.
-      // Paths with multiple types across the sample are dropped (HAVING
-      // count(*) <= 1), and nulls are ignored.
+    // we have to sample actual data and inspect it to discover the
+    // structure. Cost control happens in two places:
+    //   1. project only the nested columns (via object_construct), so
+    //      bytes-on-wire are bounded by actual variant content.
+    //   2. tier the sampling strategy by probeTableSize (see
+    //      pickSampleStrategy) — small base tables get a full scan;
+    //      large base tables get TABLESAMPLE only (no unsafe LIMIT
+    //      fallback); unknown-size sources (views, temp views) get
+    //      the best-effort TABLESAMPLE→LIMIT chain.
+    if (nestedColumns.length > 0) {
+      const variantArgs = nestedColumns
+        .map(v => `'${v.name}', "${v.name}"`)
+        .join(', ');
+      // Flatten sampled rows and emit each distinct (path, type) pair.
+      // Conflicting pairs at the same path flow through to mergeShape,
+      // which collapses them to variant — that is how we honestly
+      // surface mixed-type fields to the user.
       const makeSampleQuery = (sampleClause: string) => `
-        select path, min(type) as type
-        from (
-          select
-            regexp_replace(path, '\\\\[[0-9]+\\\\]', '[*]') as path,
-            case
-              when typeof(value) = 'INTEGER' then 'decimal'
-              when typeof(value) = 'DOUBLE' then 'decimal'
-            else lower(typeof(value)) end as type
-          from
-            (${sampleClause})
-              ,table(flatten(input => o, recursive => true)) as meta
-          group by 1,2
-        )
-        where type != 'null_value'
-        group BY 1
-        having count(*) <=1
-        order by path;
+        select
+          regexp_replace(path, '\\\\[[0-9]+\\\\]', '[*]') as path,
+          case
+            when typeof(value) = 'INTEGER' then 'decimal'
+            when typeof(value) = 'DOUBLE' then 'decimal'
+          else lower(typeof(value)) end as type
+        from
+          (${sampleClause})
+            ,table(flatten(input => o, recursive => true)) as meta
+        where typeof(value) != 'NULL_VALUE'
+        group by 1, 2
+        order by 1;
       `;
-      const limitClause =
-        `select object_construct(${variantArgs}) o` +
-        ` from ${tablePath} limit 100`;
-      // Try TABLESAMPLE first — it picks random micro-partitions without
-      // scanning the whole table, which avoids the full-scan problem on
-      // large partitioned tables. TABLESAMPLE only works on base tables,
-      // not views, so if it fails we fall back to a plain LIMIT 100.
-      const tablesampleClause =
-        `select object_construct(${variantArgs}) o` +
-        ` from ${tablePath} TABLESAMPLE BLOCK (1) limit 100`;
-      const fieldPathRows = await this.runSchemaSample(
-        makeSampleQuery(tablesampleClause),
-        makeSampleQuery(limitClause)
+      const projectVariants = `select object_construct(${variantArgs}) o`;
+      const probe = await this.probeTableSize(tablePath);
+      const strategy = pickSampleStrategy(
+        probe,
+        this.schemaSampleFullScanMaxBytes
       );
+      const n = this.schemaSampleRowLimit;
+      let fieldPathRows: QueryRecord[] | undefined;
+      if (strategy === 'full-scan-then-sample') {
+        // Small base table: one full scan catches rare fields that
+        // sampling would miss. tryBatch so a failure doesn't poison
+        // the pool connection (temp views live on it). On failure we
+        // fall through to the sample path so a slow or timed-out full
+        // scan still gets partial structure.
+        fieldPathRows =
+          (await this.executor.tryBatch(
+            makeSampleQuery(`${projectVariants} from ${tablePath}`),
+            {},
+            this.schemaSampleTimeoutMs
+          )) ?? undefined;
+      }
       if (fieldPathRows === undefined) {
-        // Both attempts failed or timed out — treat variants as opaque.
-        for (const name of variants) {
-          structDef.fields.push({type: 'sql native', rawType: 'variant', name});
+        const tablesampleQuery = makeSampleQuery(
+          `${projectVariants} from ${tablePath} TABLESAMPLE BLOCK (1) limit ${n}`
+        );
+        if (strategy === 'tablesample-only') {
+          // Known-large base table: TABLESAMPLE is safe (reads a few
+          // micro-partitions), plain LIMIT without a WHERE can be
+          // catastrophic on large partitioned tables. If TABLESAMPLE
+          // fails here we accept variant rather than risk an unbounded
+          // scan.
+          fieldPathRows =
+            (await this.executor.tryBatch(
+              tablesampleQuery,
+              {},
+              this.schemaSampleTimeoutMs
+            )) ?? undefined;
+        } else {
+          // Unknown size (view, temp view, non-parseable name) or
+          // full-scan fallback: best-effort TABLESAMPLE→LIMIT chain.
+          // The LIMIT fallback is the acknowledged "can't help" case
+          // for views over large partitioned tables.
+          fieldPathRows = await this.runSchemaSample(
+            tablesampleQuery,
+            makeSampleQuery(`${projectVariants} from ${tablePath} limit ${n}`)
+          );
         }
-      } else {
-        // Take the schema in list form and convert it into a tree.
-        const rootObject = new SnowObject('__root__', this.dialect);
+      }
+      const state = createVariantSchemaState();
+      // Snowflake nested-schema inference follows these rules:
+      // - top-level ARRAY/OBJECT from DESCRIBE are authoritative
+      // - descendant paths imply ancestor shape
+      // - conflicting shapes degrade only that prefix to variant
+      // - every top-level nested column still produces a field
+      for (const nestedColumn of nestedColumns) {
+        seedTopLevelShape(state, nestedColumn);
+      }
+      if (fieldPathRows !== undefined) {
         for (const f of fieldPathRows) {
           const pathString = f['PATH']?.valueOf().toString();
           const fieldType = f['TYPE']?.valueOf().toString();
           if (pathString === undefined || fieldType === undefined) continue;
           const pathParser = new PathParser(pathString);
-          const path = pathParser.pathChain();
-          if ('name' in path && notVariant.get(path.name)) {
+          const segments = pathParser.segments();
+          const topLevel = segments[0];
+          if (topLevel?.kind !== 'name' || notVariant.get(topLevel.name)) {
             continue;
           }
-          rootObject.walk(path, fieldType);
+          accumulateVariantPath(state, segments, fieldType);
         }
-        structDef.fields.push(...rootObject.fields);
+      }
+      // Always emit one field per top-level nested column from DESCRIBE, even
+      // if sampling produced no usable descendant paths.
+      for (const nestedColumn of nestedColumns) {
+        structDef.fields.push(
+          buildTopLevelField(nestedColumn, state, this.dialect)
+        );
       }
     }
   }
+  /**
+   * Cheap metadata probe: ask INFORMATION_SCHEMA.TABLES for the row count
+   * and byte size of tablePath. Returns undefined when the name doesn't
+   * parse as a two- or three-part identifier, when the probe query fails,
+   * or when the row has no numeric BYTES (views and external tables
+   * typically report NULL).
+   *
+   * Two-part `schema.table` names use the current database's
+   * INFORMATION_SCHEMA; three-part `db.schema.table` names address
+   * INFORMATION_SCHEMA in the named database. Identifiers are parsed
+   * with Snowflake's quoting rules so bare parts case-fold to upper and
+   * quoted parts are compared verbatim against the catalog.
+   *
+   * Undefined is also returned when the parsed name has no schema part,
+   * when no catalog row matches, when ROW_COUNT is null/undefined, or
+   * when either value is not a finite number after Number() coercion.
+   * The probe query runs through executor.tryBatch with the same
+   * schemaSampleTimeoutMs budget as the sampling queries.
+   *
+   * NOTE(review): quoteLit only doubles single quotes. Confirm whether
+   * backslashes in a quoted identifier also need escaping inside a
+   * Snowflake single-quoted string constant.
+   *
+   * @param tablePath table reference as written by the caller
+   * @returns byte size and row count, or undefined when size is unknown
+   */
+  private async probeTableSize(
+    tablePath: string
+  ): Promise<TableSizeProbe | undefined> {
+    const parsed = parseSnowflakeTableName(tablePath);
+    if (parsed === undefined || parsed.schema === undefined) return undefined; // need at least schema.table
+    const quoteLit = (s: string) => s.replace(/'/g, "''");
+    const dbQualifier = parsed.database ? `${parsed.database.sql}.` : ''; // empty: current database
+    const rows = await this.executor.tryBatch(
+      `select row_count as rc, bytes as by
+       from ${dbQualifier}information_schema.tables
+       where table_schema = '${quoteLit(parsed.schema.literal)}'
+         and table_name = '${quoteLit(parsed.table.literal)}'
+       limit 1`,
+      {},
+      this.schemaSampleTimeoutMs
+    );
+    if (!rows || rows.length === 0) return undefined; // query failed or no catalog row
+    const row = rows[0];
+    const bytesRaw = row['BY'] ?? row['by']; // accept either key casing for the alias
+    const rowsRaw = row['RC'] ?? row['rc'];
+    // Views and external tables surface null BYTES / ROW_COUNT; treat
+    // that as "unknown size" so we don't classify them as small and
+    // launch a full scan against something potentially huge.
+    if (bytesRaw === null || bytesRaw === undefined) return undefined;
+    if (rowsRaw === null || rowsRaw === undefined) return undefined;
+    const bytes = Number(bytesRaw);
+    const rowCount = Number(rowsRaw);
+    if (!Number.isFinite(bytes) || !Number.isFinite(rowCount)) return undefined; // reject NaN and Infinity
+    return {bytes, rowCount};
+  }
   /**
    * Try to run a schema sampling query, with fallback.
    * First tries the primary query (e.g. using TABLESAMPLE for speed).
@@ -535,54 +542,3 @@ export class SnowflakeConnection
     return tableName;
   }
 }
-export class PathParser extends TinyParser {
-  constructor(pathName: string) {
-    super(pathName, {
-      quoted: /^'(\\'|[^'])*'/,
-      array_of: /^\[\*]/,
-      char: /^[[.\]]/,
-      number: /^\d+/,
-      word: /^\w+/,
-    });
-  }
-  getName() {
-    const nameStart = this.next();
-    if (nameStart.type === 'word') {
-      return nameStart.text;
-    }
-    if (nameStart.type === '[') {
-      const quotedName = this.next('quoted');
-      this.next(']');
-      return quotedName.text;
-    }
-    throw this.parseError('Expected column name');
-  }
-  pathChain(): PathChain {
-    const chain: PathChain = {name: this.getName()};
-    let node: PathChain = chain;
-    for (;;) {
-      const sep = this.next();
-      if (sep.type === 'eof') {
-        return chain;
-      }
-      if (sep.type === '.') {
-        node.next = {name: this.next('word').text};
-        node = node.next;
-      } else if (sep.type === 'array_of') {
-        node.next = {arrayRef: true};
-        node = node.next;
-      } else if (sep.type === '[') {
-        // Actually a dot access through a quoted name
-        const quoted = this.next('quoted');
-        node.next = {name: quoted.text};
-        node = node.next;
-        this.next(']');
-      } else {
-        throw this.parseError(`Unexpected ${sep.type}`);
-      }
-    }
-  }
-}

package/src/snowflake_sample_strategy.spec.ts ADDED Viewed

@@ -0,0 +1,130 @@
+/*
+ * Copyright Contributors to the Malloy project
+ * SPDX-License-Identifier: MIT
+ */
+import {pickSampleStrategy} from './snowflake_connection';
+import {parseSnowflakeTableName} from './snowflake_table_name';
+describe('pickSampleStrategy', () => { // tier choice depends only on (probe, threshold)
+  const threshold = 100_000_000; // byte cap used as fullScanMaxBytes in these cases
+  test('no probe → best-effort tablesample-then-limit', () => {
+    expect(pickSampleStrategy(undefined, threshold)).toBe(
+      'tablesample-then-limit'
+    );
+  });
+  test('probe at or below threshold → full-scan-then-sample', () => { // boundary is inclusive
+    expect(pickSampleStrategy({bytes: 0, rowCount: 0}, threshold)).toBe(
+      'full-scan-then-sample'
+    );
+    expect(pickSampleStrategy({bytes: threshold, rowCount: 1}, threshold)).toBe(
+      'full-scan-then-sample'
+    );
+  });
+  test('probe above threshold → tablesample-only (no unsafe LIMIT fallback)', () => {
+    expect(
+      pickSampleStrategy({bytes: threshold + 1, rowCount: 1}, threshold) // first value past the boundary
+    ).toBe('tablesample-only');
+    expect(
+      pickSampleStrategy(
+        {bytes: 10_000_000_000, rowCount: 1_000_000_000},
+        threshold
+      )
+    ).toBe('tablesample-only');
+  });
+  test('threshold=0 forces every probed table into tablesample-only', () => { // NOTE(review): only checks bytes: 1; a probe with bytes: 0 still satisfies the <= comparison and full-scans
+    expect(pickSampleStrategy({bytes: 1, rowCount: 1}, 0)).toBe(
+      'tablesample-only'
+    );
+  });
+});
+describe('parseSnowflakeTableName', () => { // expectations: 1-3 part names parse; each part reports literal, sql and quoted
+  test('single bare identifier', () => { // no schema or database key is expected in the result
+    expect(parseSnowflakeTableName('aircraft')).toEqual({
+      table: {literal: 'AIRCRAFT', sql: 'AIRCRAFT', quoted: false},
+    });
+  });
+  test('two-part bare name uppercases both parts', () => {
+    expect(parseSnowflakeTableName('malloytest.aircraft')).toEqual({
+      schema: {literal: 'MALLOYTEST', sql: 'MALLOYTEST', quoted: false},
+      table: {literal: 'AIRCRAFT', sql: 'AIRCRAFT', quoted: false},
+    });
+  });
+  test('three-part bare name', () => {
+    expect(parseSnowflakeTableName('db.sch.t')).toEqual({
+      database: {literal: 'DB', sql: 'DB', quoted: false},
+      schema: {literal: 'SCH', sql: 'SCH', quoted: false},
+      table: {literal: 'T', sql: 'T', quoted: false},
+    });
+  });
+  test('quoted identifier preserves case', () => { // literal drops the quotes, sql keeps them
+    expect(parseSnowflakeTableName('"MyDb"."schema"."t"')).toEqual({
+      database: {literal: 'MyDb', sql: '"MyDb"', quoted: true},
+      schema: {literal: 'schema', sql: '"schema"', quoted: true},
+      table: {literal: 't', sql: '"t"', quoted: true},
+    });
+  });
+  test('quoted identifier allows embedded dots', () => { // dots inside quotes are not separators
+    expect(parseSnowflakeTableName('"a.b"."c.d"')).toEqual({
+      schema: {literal: 'a.b', sql: '"a.b"', quoted: true},
+      table: {literal: 'c.d', sql: '"c.d"', quoted: true},
+    });
+  });
+  test('doubled double-quote is a literal quote', () => { // literal is unescaped, sql stays escaped
+    expect(parseSnowflakeTableName('"a""b"')).toEqual({
+      table: {literal: 'a"b', sql: '"a""b"', quoted: true},
+    });
+  });
+  test('mixes quoted and bare parts', () => {
+    expect(parseSnowflakeTableName('MYDB."mixed"')).toEqual({
+      schema: {literal: 'MYDB', sql: 'MYDB', quoted: false},
+      table: {literal: 'mixed', sql: '"mixed"', quoted: true},
+    });
+  });
+  test('tolerates surrounding whitespace and whitespace around dots', () => {
+    expect(parseSnowflakeTableName(' sch . t ')).toEqual({
+      schema: {literal: 'SCH', sql: 'SCH', quoted: false},
+      table: {literal: 'T', sql: 'T', quoted: false},
+    });
+  });
+  test('returns undefined for empty input', () => { // from here on: inputs expected to yield undefined, not throw
+    expect(parseSnowflakeTableName('')).toBeUndefined();
+  });
+  test('returns undefined for four-part name', () => {
+    expect(parseSnowflakeTableName('a.b.c.d')).toBeUndefined();
+  });
+  test('returns undefined for trailing dot', () => {
+    expect(parseSnowflakeTableName('sch.')).toBeUndefined();
+  });
+  test('returns undefined for leading dot', () => {
+    expect(parseSnowflakeTableName('.t')).toBeUndefined();
+  });
+  test('returns undefined for unterminated quoted identifier', () => {
+    expect(parseSnowflakeTableName('"oops')).toBeUndefined();
+  });
+  test('returns undefined for identifier starting with a digit', () => {
+    expect(parseSnowflakeTableName('1foo')).toBeUndefined();
+  });
+  test('returns undefined for identifier containing a dash', () => {
+    expect(parseSnowflakeTableName('foo-bar')).toBeUndefined();
+  });
+});