npm - sql-fmt-cli - Versions diffs - 1.0.0 - Mend

sql-fmt-cli 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (3) hide show

package/README.md ADDED Viewed

@@ -0,0 +1,61 @@
+# sql-fmt-cli
+> Format SQL queries from stdin or file — uppercase keywords, one clause per line, indent subqueries. Zero dependencies.
+[![npm version](https://img.shields.io/npm/v/sql-fmt-cli.svg)](https://www.npmjs.com/package/sql-fmt-cli)
+[![license](https://img.shields.io/npm/l/sql-fmt-cli.svg)](LICENSE)
+## Install
+```bash
+npm install -g sql-fmt-cli
+```
+## Usage
+```bash
+# Format a file (prints the result to stdout; the file itself is not modified)
+sqlfmt query.sql
+# Pipe from stdin
+echo "select id,name from users where active=1 order by name" | sqlfmt
+# CI check — exits 1 if not formatted
+sqlfmt query.sql --check
+```
+## Example
+Input:
+```sql
+select id,name from users where active=1 order by name
+```
+Output:
+```sql
+SELECT id,
+       name
+FROM users
+WHERE active=1
+ORDER BY name
+```
+## Features
+- Uppercases all SQL keywords (`SELECT`, `FROM`, `WHERE`, `JOIN`, `GROUP BY`, …)
+- Puts each clause on its own line
+- Indents subqueries inside parentheses
+- Handles quoted strings and identifiers without corrupting them
+- Preserves `--` line comments and `/* */` block comments
+- `--check` flag for CI pipelines
+- Zero runtime dependencies — pure Node.js
+## Supported SQL
+Works with MySQL, PostgreSQL, SQLite, and most ANSI SQL dialects.
+Supports: `SELECT`, `FROM`, `WHERE`, `JOIN` variants, `GROUP BY`, `HAVING`, `ORDER BY`, `LIMIT`, `OFFSET`, `UNION`, `INSERT`, `UPDATE`, `DELETE`, `CREATE TABLE`, `ALTER TABLE`, `WITH` (CTEs), window functions, `CASE` expressions, and more.
+## License
+MIT

package/index.js ADDED Viewed

@@ -0,0 +1,410 @@
+#!/usr/bin/env node
+'use strict';
+const fs = require('fs');
+const path = require('path');
+// Comparator that puts longer entries first, so a multi-word phrase is always
+// tried before any shorter keyword it contains.
+const byLengthDesc = (a, b) => b.length - a.length;
+// Every keyword (or keyword phrase) that gets uppercased, longest first.
+const KEYWORDS = [
+  'SELECT', 'DISTINCT', 'FROM', 'WHERE', 'GROUP BY', 'HAVING', 'ORDER BY',
+  'LIMIT', 'OFFSET', 'INNER JOIN', 'LEFT JOIN', 'RIGHT JOIN', 'FULL JOIN',
+  'FULL OUTER JOIN', 'LEFT OUTER JOIN', 'RIGHT OUTER JOIN', 'CROSS JOIN',
+  'JOIN', 'ON', 'AS', 'AND', 'OR', 'NOT', 'IN', 'EXISTS', 'BETWEEN',
+  'LIKE', 'ILIKE', 'IS NULL', 'IS NOT NULL', 'NULL', 'TRUE', 'FALSE',
+  'CASE', 'WHEN', 'THEN', 'ELSE', 'END', 'UNION ALL', 'UNION', 'INTERSECT',
+  'EXCEPT', 'INSERT INTO', 'INSERT', 'INTO', 'VALUES', 'UPDATE', 'SET',
+  'DELETE FROM', 'DELETE', 'CREATE TABLE', 'CREATE INDEX', 'CREATE VIEW',
+  'CREATE', 'DROP TABLE', 'DROP', 'ALTER TABLE', 'ALTER', 'ADD COLUMN',
+  'ADD', 'COLUMN', 'PRIMARY KEY', 'FOREIGN KEY', 'REFERENCES', 'UNIQUE',
+  'DEFAULT', 'NOT NULL', 'AUTO_INCREMENT', 'AUTOINCREMENT', 'SERIAL',
+  'WITH', 'RECURSIVE', 'OVER', 'PARTITION BY', 'ROW_NUMBER', 'RANK',
+  'DENSE_RANK', 'COALESCE', 'NULLIF', 'CAST', 'CONVERT', 'COUNT', 'SUM',
+  'AVG', 'MIN', 'MAX', 'IF', 'IFNULL',
+  'ASC', 'DESC', 'ALL', 'ANY', 'SOME', 'TRUNCATE', 'EXPLAIN', 'ANALYZE',
+  'RETURNING', 'CONFLICT', 'DO NOTHING', 'DO UPDATE',
+].sort(byLengthDesc);
+// The subset of keywords that open a clause: at paren depth 0 each of these
+// starts a new output line. Also ordered longest first.
+const CLAUSE_KEYWORDS = [
+  'SELECT', 'DISTINCT', 'FROM', 'WHERE', 'GROUP BY', 'HAVING', 'ORDER BY',
+  'LIMIT', 'OFFSET',
+  'INNER JOIN', 'LEFT JOIN', 'RIGHT JOIN', 'FULL JOIN',
+  'FULL OUTER JOIN', 'LEFT OUTER JOIN', 'RIGHT OUTER JOIN', 'CROSS JOIN',
+  'JOIN', 'ON',
+  'UNION ALL', 'UNION', 'INTERSECT', 'EXCEPT',
+  'INSERT INTO', 'INSERT', 'INTO', 'VALUES', 'UPDATE', 'SET',
+  'DELETE FROM', 'DELETE',
+  'CREATE TABLE', 'CREATE INDEX', 'CREATE VIEW', 'CREATE',
+  'DROP TABLE', 'DROP', 'ALTER TABLE', 'ALTER',
+  'WITH', 'RETURNING', 'EXPLAIN', 'ANALYZE',
+].sort(byLengthDesc);
+/**
+ * Split raw SQL text into a flat list of `{ type, value }` tokens.
+ *
+ * Token types: string (single-quoted, double-quoted and backtick-quoted
+ * spans), comment_line, comment_block, paren_open, paren_close, comma,
+ * semicolon, whitespace, word. Every input character lands in exactly one
+ * token, so concatenating the token values reproduces the input.
+ *
+ * @param {string} sql Raw SQL text.
+ * @returns {Array<{type: string, value: string}>} Tokens in input order.
+ */
+function tokenize(sql) {
+  const PUNCTUATION = new Map([
+    ['(', 'paren_open'],
+    [')', 'paren_close'],
+    [',', 'comma'],
+    [';', 'semicolon'],
+  ]);
+  const isSpace = (ch) => /\s/.test(ch);
+  const endsWord = (ch) => /[\s(),;'"` ]/.test(ch);
+  const total = sql.length;
+  const tokens = [];
+  // Record sql[from, to) as one token and return the position to resume at.
+  const take = (type, from, to) => {
+    tokens.push({ type, value: sql.slice(from, to) });
+    return to;
+  };
+  // Index just past the quote that closes the span opened at `open`. A
+  // doubled quote character is an escaped quote and does not close the span;
+  // an unterminated span runs to the end of the input.
+  const quotedEnd = (open) => {
+    const quote = sql[open];
+    let at = open + 1;
+    while (at < total) {
+      if (sql[at] !== quote) {
+        at += 1;
+      } else if (sql[at + 1] === quote) {
+        at += 2;
+      } else {
+        return at + 1;
+      }
+    }
+    return at;
+  };
+  // Like String#indexOf, but a miss yields the end of the input.
+  const findOrEnd = (needle, from) => {
+    const hit = sql.indexOf(needle, from);
+    return hit === -1 ? total : hit;
+  };
+  let pos = 0;
+  while (pos < total) {
+    const ch = sql[pos];
+    // 'string literal' or "quoted identifier"
+    if (ch === "'" || ch === '"') {
+      pos = take('string', pos, quotedEnd(pos));
+      continue;
+    }
+    // `backtick identifier` (no escape handling: ends at the next backtick)
+    if (ch === '`') {
+      pos = take('string', pos, findOrEnd('`', pos + 1) + 1);
+      continue;
+    }
+    // -- line comment, up to (not including) the newline
+    if (ch === '-' && sql[pos + 1] === '-') {
+      pos = take('comment_line', pos, findOrEnd('\n', pos));
+      continue;
+    }
+    // /* block comment */, including the closing delimiter
+    if (ch === '/' && sql[pos + 1] === '*') {
+      pos = take('comment_block', pos, findOrEnd('*/', pos + 2) + 2);
+      continue;
+    }
+    // Single-character punctuation
+    const punctuation = PUNCTUATION.get(ch);
+    if (punctuation !== undefined) {
+      pos = take(punctuation, pos, pos + 1);
+      continue;
+    }
+    // A run of whitespace becomes one token
+    if (isSpace(ch)) {
+      let wsEnd = pos + 1;
+      while (wsEnd < total && isSpace(sql[wsEnd])) wsEnd += 1;
+      pos = take('whitespace', pos, wsEnd);
+      continue;
+    }
+    // Anything else: a word/symbol run up to the next delimiter
+    let wordEnd = pos;
+    while (wordEnd < total && !endsWord(sql[wordEnd])) wordEnd += 1;
+    if (wordEnd === pos) wordEnd += 1; // always consume at least one char
+    pos = take('word', pos, wordEnd);
+  }
+  return tokens;
+}
+/**
+ * Replace keyword words in a token stream with their canonical uppercase
+ * form. A multi-word keyword ("ORDER BY", "IS NOT NULL", ...) whose words are
+ * separated only by whitespace tokens collapses into a single word token
+ * holding the phrase with single spaces. All other tokens (strings, comments,
+ * punctuation, whitespace, unmatched words) are passed through untouched.
+ *
+ * @param {Array<{type: string, value: string}>} tokens Output of tokenize().
+ * @returns {Array<{type: string, value: string}>} New token array.
+ */
+function uppercaseKeywords(tokens) {
+  // Try to match the keyword made of `words` against the tokens starting at
+  // `from`, allowing whitespace tokens between (not before) its words.
+  // Returns the index just past the last matched word, or -1 on no match.
+  const phraseEnd = (words, from) => {
+    let at = from;
+    let matchedWords = 0;
+    while (matchedWords < words.length && at < tokens.length) {
+      const candidate = tokens[at];
+      if (candidate.type === 'whitespace' && matchedWords > 0) {
+        at += 1;
+        continue;
+      }
+      if (candidate.type !== 'word' || candidate.value.toUpperCase() !== words[matchedWords]) {
+        break;
+      }
+      at += 1;
+      matchedWords += 1;
+    }
+    return matchedWords === words.length ? at : -1;
+  };
+  const result = [];
+  let pos = 0;
+  while (pos < tokens.length) {
+    let emitted = tokens[pos];
+    let next = pos + 1;
+    if (emitted.type === 'word') {
+      // KEYWORDS is ordered longest-first, so the first hit is the longest one.
+      for (const kw of KEYWORDS) {
+        const end = phraseEnd(kw.split(' '), pos);
+        if (end !== -1) {
+          emitted = { type: 'word', value: kw };
+          next = end;
+          break;
+        }
+      }
+    }
+    result.push(emitted);
+    pos = next;
+  }
+  return result;
+}
+/**
+ * Rebuild a formatted SQL string from the token stream.
+ * - Clause keywords at paren depth 0 start on a new line
+ * - A '(' directly followed by a clause keyword breaks the line and indents
+ *   by one `indentStr` per depth level
+ * - Commas at depth 0 produce a newline plus a 7-space continuation indent;
+ *   commas inside parentheses are followed by a single space
+ * - A `--` line comment always ends its output line, so the token after it
+ *   can never be absorbed into the comment
+ * - Statements separated by ';' are divided by exactly one blank line
+ *
+ * @param {Array<{type: string, value: string}>} tokens Token stream; clause
+ *   keywords are recognised only as single uppercase word tokens (the form
+ *   uppercaseKeywords() produces).
+ * @param {string} [indentStr='  '] Indent unit per paren depth level.
+ * @returns {string} Formatted SQL ending in exactly one newline.
+ */
+function format(tokens, indentStr = '  ') {
+  let depth = 0;
+  // Helper: current indent prefix for depth
+  const indent = (d) => indentStr.repeat(d);
+  // Raw whitespace carries no layout information: reduce each whitespace
+  // token to a bare marker and decide spacing from context while emitting.
+  const parts = tokens.map((tok) => (tok.type === 'whitespace' ? { type: 'ws' } : tok));
+  let out = '';
+  let col = 0; // approximate column position
+  let prevNonWs = null;
+  // Set after a `--` comment: the comment extends to end of line, so whatever
+  // comes next must start on a fresh line or it would be commented out.
+  let breakBeforeNext = false;
+  function emit(str) {
+    out += str;
+    const lastNl = str.lastIndexOf('\n');
+    if (lastNl >= 0) col = str.length - lastNl - 1;
+    else col += str.length;
+  }
+  function newline(d) {
+    out += '\n' + indent(d);
+    col = indent(d).length;
+  }
+  // Trim leading/trailing whitespace tokens
+  let start = 0;
+  let end = parts.length - 1;
+  while (start <= end && parts[start].type === 'ws') start++;
+  while (end >= start && parts[end].type === 'ws') end--;
+  for (let idx = start; idx <= end; idx++) {
+    const p = parts[idx];
+    if (p.type === 'ws') {
+      // Spacing is handled contextually; skip raw whitespace
+      continue;
+    }
+    if (breakBeforeNext) {
+      newline(depth);
+      breakBeforeNext = false;
+    }
+    if (p.type === 'paren_open') {
+      emit('(');
+      depth++;
+      // Look ahead: if next non-ws is a clause keyword, newline+indent
+      let next = idx + 1;
+      while (next <= end && parts[next].type === 'ws') next++;
+      if (next <= end && parts[next].type === 'word' && CLAUSE_KEYWORDS.includes(parts[next].value)) {
+        newline(depth);
+      }
+      prevNonWs = p;
+      continue;
+    }
+    if (p.type === 'paren_close') {
+      depth = Math.max(0, depth - 1);
+      let closedOnOwnLine = false;
+      if (out.length > 0 && out[out.length - 1] !== '\n' && col > 0) {
+        const lastNl = out.lastIndexOf('\n');
+        if (lastNl >= 0 && out.slice(lastNl + 1).trim() === '') {
+          // Current line holds only indentation: re-indent it to the
+          // enclosing depth and put the ')' there.
+          out = out.slice(0, lastNl + 1) + indent(depth) + ')';
+          col = indent(depth).length + 1;
+          closedOnOwnLine = true;
+        }
+      }
+      if (!closedOnOwnLine) emit(')');
+      prevNonWs = p;
+      continue;
+    }
+    if (p.type === 'comma') {
+      emit(',');
+      if (depth === 0) {
+        newline(0);
+        // Emit an indent to align with SELECT columns
+        emit('       '); // 7 spaces aligns under "SELECT "
+      } else {
+        // Inside parens: comma + space
+        emit(' ');
+      }
+      prevNonWs = p;
+      continue;
+    }
+    if (p.type === 'semicolon') {
+      emit(';');
+      if (idx < end) {
+        // Blank line between statements; a new statement restarts at depth 0
+        out += '\n\n';
+        col = 0;
+        depth = 0;
+      }
+      prevNonWs = p;
+      continue;
+    }
+    if (p.type === 'word' && depth === 0 && CLAUSE_KEYWORDS.includes(p.value)) {
+      // Clause keyword at top level: start a new line unless the output is
+      // already at a line start (very first token, right after ';', or right
+      // after a line comment) — otherwise an extra blank line would appear.
+      if (prevNonWs !== null && !out.endsWith('\n')) {
+        newline(0);
+      }
+      emit(p.value);
+      emit(' ');
+      prevNonWs = p;
+      continue;
+    }
+    // Any other word, string or comment: separate it from the previous token
+    // with one space, except right after '(' or ',' or when the output
+    // already ends in a space or newline.
+    if (prevNonWs !== null &&
+        prevNonWs.type !== 'paren_open' &&
+        prevNonWs.type !== 'comma' &&
+        !out.endsWith(' ') && !out.endsWith('\n')) {
+      emit(' ');
+    }
+    emit(p.value);
+    if (p.type === 'comment_line') breakBeforeNext = true;
+    prevNonWs = p;
+  }
+  // Trim trailing whitespace on each line
+  out = out.split('\n').map(l => l.trimEnd()).join('\n');
+  // Ensure single trailing newline
+  out = out.trimEnd() + '\n';
+  return out;
+}
+/**
+ * Format a SQL string: tokenize it, uppercase its keywords, then lay the
+ * tokens out again.
+ *
+ * @param {string} sql Raw SQL text.
+ * @returns {string} The formatted SQL.
+ */
+function formatSQL(sql) {
+  return format(uppercaseKeywords(tokenize(sql)));
+}
+// ─── CLI ───────────────────────────────────────────────────────────────────
+// Arguments after `node <script>`. `--check` switches to check mode; every
+// argument that does not start with `--` is taken as an input file path.
+const [, , ...args] = process.argv;
+const checkMode = args.some((arg) => arg === '--check');
+const fileArgs = args.filter((arg) => !arg.startsWith('--'));
+/**
+ * Process one SQL input.
+ *
+ * Normal mode: write the formatted SQL to stdout.
+ * Check mode (`--check`): write nothing but a status message. The input
+ * counts as formatted only when it is byte-for-byte equal to the formatter's
+ * output. A failure sets `process.exitCode` to 1 instead of exiting right
+ * away, so every remaining input is still checked and the process ends with
+ * status 1 if any of them failed.
+ *
+ * @param {string} sql Raw SQL text read from a file or stdin.
+ * @returns {void}
+ */
+function run(sql) {
+  const formatted = formatSQL(sql);
+  if (!checkMode) {
+    process.stdout.write(formatted);
+    return;
+  }
+  // Compare the ORIGINAL input with the formatted result; comparing two
+  // formatter outputs would always succeed.
+  if (sql === formatted) {
+    process.stdout.write('SQL is already formatted.\n');
+  } else {
+    process.stderr.write('SQL is not formatted. Run sqlfmt to fix.\n');
+    process.exitCode = 1;
+  }
+}
+if (fileArgs.length > 0) {
+  // Read from file(s), in the order given
+  for (const filePath of fileArgs) {
+    let sql;
+    try {
+      // Read directly instead of testing existence first: the file could
+      // vanish between the two calls, and existing-but-unreadable paths
+      // (directories, permission errors) need reporting as well.
+      sql = fs.readFileSync(path.resolve(filePath), 'utf8');
+    } catch (err) {
+      const reason = err.code === 'ENOENT'
+        ? `file not found: ${filePath}`
+        : `cannot read ${filePath}: ${err.message}`;
+      process.stderr.write(`sqlfmt: ${reason}\n`);
+      process.exit(1);
+    }
+    run(sql);
+  }
+} else {
+  // Read from stdin: collect everything, then process once the stream ends
+  let input = '';
+  process.stdin.setEncoding('utf8');
+  process.stdin.on('data', chunk => { input += chunk; });
+  process.stdin.on('end', () => {
+    if (!input.trim()) {
+      process.stderr.write('sqlfmt: no input. Usage: sqlfmt query.sql  or  echo "SELECT ..." | sqlfmt\n');
+      process.exit(1);
+    }
+    run(input);
+  });
+  process.stdin.resume();
+}

package/package.json ADDED Viewed

@@ -0,0 +1,35 @@
+{
+  "name": "sql-fmt-cli",
+  "version": "1.0.0",
+  "description": "Format SQL queries from stdin or file — uppercase keywords, one clause per line, indent subqueries",
+  "main": "index.js",
+  "bin": {
+    "sqlfmt": "./index.js"
+  },
+  "scripts": {
+    "test": "echo \"select id,name from users where active=1 order by name\" | node index.js"
+  },
+  "keywords": [
+    "sql",
+    "format",
+    "prettier",
+    "cli",
+    "database",
+    "formatter",
+    "sql-formatter",
+    "query",
+    "mysql",
+    "postgres",
+    "sqlite"
+  ],
+  "author": "chengyixu",
+  "license": "MIT",
+  "repository": {
+    "type": "git",
+    "url": "https://github.com/chengyixu/sql-fmt-cli"
+  },
+  "homepage": "https://github.com/chengyixu/sql-fmt-cli#readme",
+  "engines": {
+    "node": ">=12.0.0"
+  }
+}