npm - design-clone - Versions diffs - 1.2.0 → 2.1.0 - Mend

design-clone 1.2.0 → 2.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (66)

package/README.md +26 -12
package/bin/commands/clone-site.js +75 -10
package/bin/commands/init.js +33 -1
package/bin/commands/verify.js +5 -3
package/bin/utils/validate.js +24 -8
package/docs/cli-reference.md +200 -2
package/docs/codebase-summary.md +309 -0
package/docs/design-clone-architecture.md +259 -42
package/docs/pixel-perfect.md +35 -4
package/docs/project-roadmap.md +382 -0
package/docs/troubleshooting.md +5 -4
package/package.json +10 -8
package/src/ai/__pycache__/analyze-structure.cpython-313.pyc +0 -0
package/src/ai/__pycache__/extract-design-tokens.cpython-313.pyc +0 -0
package/src/ai/analyze-structure.py +73 -3
package/src/ai/extract-design-tokens.py +356 -13
package/src/ai/prompts/__pycache__/design_tokens.cpython-313.pyc +0 -0
package/src/ai/prompts/__pycache__/structure_analysis.cpython-313.pyc +0 -0
package/src/ai/prompts/__pycache__/ux_audit.cpython-313.pyc +0 -0
package/src/ai/prompts/design_tokens.py +133 -0
package/src/ai/prompts/structure_analysis.py +329 -10
package/src/ai/prompts/ux_audit.py +198 -0
package/src/ai/ux-audit.js +596 -0
package/src/core/app-state-snapshot.js +511 -0
package/src/core/content-counter.js +342 -0
package/src/core/cookie-handler.js +1 -1
package/src/core/css-extractor.js +4 -4
package/src/core/dimension-extractor.js +93 -21
package/src/core/dimension-output.js +103 -6
package/src/core/discover-pages.js +242 -14
package/src/core/dom-tree-analyzer.js +298 -0
package/src/core/extract-assets.js +1 -1
package/src/core/framework-detector.js +538 -0
package/src/core/html-extractor.js +45 -4
package/src/core/lazy-loader.js +7 -7
package/src/core/multi-page-screenshot.js +9 -6
package/src/core/page-readiness.js +8 -8
package/src/core/screenshot.js +138 -9
package/src/core/section-cropper.js +209 -0
package/src/core/section-detector.js +386 -0
package/src/core/semantic-enhancer.js +492 -0
package/src/core/state-capture.js +18 -22
package/src/core/tests/test-section-cropper.js +177 -0
package/src/core/tests/test-section-detector.js +55 -0
package/src/core/video-capture.js +152 -146
package/src/route-discoverers/angular-discoverer.js +157 -0
package/src/route-discoverers/astro-discoverer.js +123 -0
package/src/route-discoverers/base-discoverer.js +242 -0
package/src/route-discoverers/index.js +106 -0
package/src/route-discoverers/next-discoverer.js +130 -0
package/src/route-discoverers/nuxt-discoverer.js +138 -0
package/src/route-discoverers/react-discoverer.js +139 -0
package/src/route-discoverers/svelte-discoverer.js +109 -0
package/src/route-discoverers/universal-discoverer.js +227 -0
package/src/route-discoverers/vue-discoverer.js +118 -0
package/src/utils/__init__.py +1 -1
package/src/utils/__pycache__/__init__.cpython-313.pyc +0 -0
package/src/utils/browser.js +11 -37
package/src/utils/playwright.js +213 -0
package/src/verification/generate-audit-report.js +398 -0
package/src/verification/verify-footer.js +493 -0
package/src/verification/verify-header.js +486 -0
package/src/verification/verify-layout.js +2 -2
package/src/verification/verify-menu.js +4 -20
package/src/verification/verify-slider.js +533 -0
package/src/utils/puppeteer.js +0 -281

package/src/core/dimension-output.js CHANGED

@@ -89,7 +89,18 @@ export function sanitizeViewportData(data, vpName) {
 }
 /**
- * Build cross-viewport summary for AI consumption
+ * Build cross-viewport summary for AI consumption.
+ * Includes section-aware typography and container data.
+ *
+ * @param {Object} viewports - Viewport data keyed by name (desktop, tablet, mobile)
+ * @returns {Object} Summary with:
+ *   - maxContainerWidth: Largest container width across all viewports
+ *   - commonGap: Average gap from card patterns
+ *   - breakpoints: Viewport width breakpoints
+ *   - typography: Flat h1/h2/h3/body sizes by viewport (backward compat)
+ *   - typographyBySection: Typography grouped by section context (hero h1 != content h1)
+ *   - cardPatterns: Card group statistics
+ *   - sections: Section detection summary (found flag + width/containerWidth)
  */
 export function buildCrossViewportSummary(viewports) {
   const summary = {
@@ -100,31 +111,83 @@ export function buildCrossViewportSummary(viewports) {
       tablet: VIEWPORTS.tablet.width,
       mobile: VIEWPORTS.mobile.width
     },
+    // Flat typography for backward compatibility
     typography: { h1: {}, h2: {}, h3: {}, body: {} },
-    cardPatterns: { totalGroups: 0, avgCardSize: null }
+    // NEW: Typography by section context
+    typographyBySection: {
+      hero: {},
+      content: {},
+      header: {},
+      footer: {},
+      sidebar: {}
+    },
+    cardPatterns: { totalGroups: 0, avgCardSize: null },
+    // NEW: Section summary
+    sections: {
+      hero: { found: false, containerWidth: null },
+      content: { found: false, containerWidth: null },
+      header: { found: false, containerWidth: null },
+      footer: { found: false, containerWidth: null },
+      sidebar: { found: false, width: null }
+    }
   };
   for (const [vpName, vpData] of Object.entries(viewports)) {
     if (!vpData) continue;
+    // Container section mapping
     if (vpData.containers) {
       for (const container of vpData.containers) {
         if (container.width > summary.maxContainerWidth) {
           summary.maxContainerWidth = container.width;
         }
+        // Track section widths
+        const section = container.section || 'content';
+        if (summary.sections[section]) {
+          summary.sections[section].found = true;
+          // Sidebar uses 'width' field, others use 'containerWidth'
+          if (section === 'sidebar') {
+            if (!summary.sections[section].width ||
+                container.width > summary.sections[section].width) {
+              summary.sections[section].width = container.width;
+            }
+          } else {
+            if (!summary.sections[section].containerWidth ||
+                container.width > summary.sections[section].containerWidth) {
+              summary.sections[section].containerWidth = container.width;
+            }
+          }
+        }
       }
     }
+    // Typography by section
     if (vpData.typography) {
       for (const typo of vpData.typography) {
         const tag = typo.selector?.toLowerCase();
-        if (tag === 'h1') summary.typography.h1[vpName] = typo.fontSize;
-        if (tag === 'h2') summary.typography.h2[vpName] = typo.fontSize;
-        if (tag === 'h3') summary.typography.h3[vpName] = typo.fontSize;
-        if (tag === 'p') summary.typography.body[vpName] = typo.fontSize;
+        const section = typo.section || 'content';
+        // Flat typography (backward compat) - take first found
+        if (tag === 'h1' && !summary.typography.h1[vpName]) summary.typography.h1[vpName] = typo.fontSize;
+        if (tag === 'h2' && !summary.typography.h2[vpName]) summary.typography.h2[vpName] = typo.fontSize;
+        if (tag === 'h3' && !summary.typography.h3[vpName]) summary.typography.h3[vpName] = typo.fontSize;
+        if (tag === 'p' && !summary.typography.body[vpName]) summary.typography.body[vpName] = typo.fontSize;
+        // Typography by section
+        if (!summary.typographyBySection[section]) {
+          summary.typographyBySection[section] = {};
+        }
+        if (!summary.typographyBySection[section][tag]) {
+          summary.typographyBySection[section][tag] = {};
+        }
+        // Take first found per section/tag/viewport
+        if (!summary.typographyBySection[section][tag][vpName]) {
+          summary.typographyBySection[section][tag][vpName] = typo.fontSize;
+        }
       }
     }
+    // Card patterns (unchanged)
     if (vpData.cards && vpData.cards.length > 0) {
       summary.cardPatterns.totalGroups += vpData.cards.length;
       if (vpName === 'desktop' && vpData.cards[0]?.avgDimensions) {
@@ -143,6 +206,7 @@ export function buildCrossViewportSummary(viewports) {
 /**
  * Generate AI-friendly summary (compact, <5KB)
+ * Includes section-aware typography for accurate reconstruction
  * @param {Object} fullOutput - Full component-dimensions.json
  * @returns {Object} Compact summary for AI prompts
  */
@@ -173,6 +237,29 @@ export function generateAISummary(fullOutput) {
     };
   }
+  /**
+   * Convert typographyBySection to AI-friendly format with px units
+   */
+  function inferTypographyBySection(typographyBySection) {
+    const result = {};
+    for (const [section, tags] of Object.entries(typographyBySection || {})) {
+      if (!tags || Object.keys(tags).length === 0) continue;
+      result[section] = {};
+      for (const [tag, sizes] of Object.entries(tags)) {
+        // Use desktop first, then tablet, then mobile
+        const size = sizes.desktop || sizes.tablet || sizes.mobile || 0;
+        if (size > 0) {
+          result[section][tag] = size + "px";
+        }
+      }
+      // Remove empty sections
+      if (Object.keys(result[section]).length === 0) {
+        delete result[section];
+      }
+    }
+    return result;
+  }
   return {
     _comment: "USE THESE EXACT VALUES - DO NOT ESTIMATE",
     EXACT_DIMENSIONS: {
@@ -187,6 +274,16 @@ export function generateAISummary(fullOutput) {
       h3: (summary.typography.h3.desktop || 24) + "px",
       body: (summary.typography.body.desktop || 16) + "px"
     },
+    // NEW: Section-aware typography (hero h1 != content h1)
+    TYPOGRAPHY_BY_SECTION: inferTypographyBySection(summary.typographyBySection),
+    // NEW: Section info
+    SECTIONS: {
+      hero: summary.sections?.hero || { found: false },
+      content: summary.sections?.content || { found: false },
+      header: summary.sections?.header || { found: false },
+      footer: summary.sections?.footer || { found: false },
+      sidebar: summary.sections?.sidebar || { found: false }
+    },
     RESPONSIVE: {
       desktop_breakpoint: summary.breakpoints.desktop + "px",
       tablet_breakpoint: summary.breakpoints.tablet + "px",

package/src/core/discover-pages.js CHANGED

@@ -4,6 +4,11 @@
  * Extracts navigation links from a website to discover cloneable pages.
  * Handles SPA hydration, filters external links, and normalizes URLs.
  *
+ * Enhanced with SPA/Framework support (v1.3):
+ * - Framework detection (Next.js, Nuxt, Vue, React, Angular, Svelte, Astro)
+ * - Framework-specific route discovery
+ * - App state capture (optional)
+ *
  * Usage:
  *   import { discoverPages } from './discover-pages.js';
  *   const result = await discoverPages('https://example.com', { maxPages: 10 });
@@ -13,6 +18,11 @@ import { getBrowser, getPage, disconnectBrowser } from '../utils/browser.js';
 import { waitForDomStable, waitForPageReady } from './page-readiness.js';
 import { dismissCookieBanner } from './cookie-handler.js';
+// SPA/Framework support imports
+import { detectFramework, formatDetectionResult } from './framework-detector.js';
+import { discoverRoutes as discoverFrameworkRoutes } from '../route-discoverers/index.js';
+import { captureAppState, formatStateSnapshot } from './app-state-snapshot.js';
 // Navigation selectors in priority order
 const NAV_SELECTORS = [
   'header nav a',
@@ -41,14 +51,47 @@ const EXCLUDE_PATTERNS = [
   /tiktok\.com/i
 ];
+// Valid framework names for validation
+const VALID_FRAMEWORKS = ['next', 'nuxt', 'vue', 'react', 'angular', 'svelte', 'astro'];
 // Default options
 const DEFAULT_OPTIONS = {
   maxPages: 10,
   selectors: null,  // Use default NAV_SELECTORS if null
   includeSubdomains: false,
-  timeout: 30000
+  timeout: 30000,
+  // SPA/Framework options (v1.3)
+  spaMode: true,         // Enable SPA detection and route discovery
+  framework: null,       // Force specific framework (skip detection)
+  noSpaDetect: false,    // Disable SPA/framework detection entirely
+  captureState: false    // Capture app state (Redux/Vuex/Pinia/Zustand)
 };
+/**
+ * Log warning message (only in TTY mode)
+ * @param {string} message - Warning message
+ */
+function logWarning(message) {
+  if (process.stderr.isTTY) {
+    console.error(`[discover-pages] WARN: ${message}`);
+  }
+}
+/**
+ * Validate and normalize framework option
+ * @param {string|null} framework - Framework name to validate
+ * @returns {string|null} Validated framework name or null
+ */
+function validateFramework(framework) {
+  if (!framework) return null;
+  const normalized = String(framework).toLowerCase().trim();
+  if (VALID_FRAMEWORKS.includes(normalized)) {
+    return normalized;
+  }
+  logWarning(`Invalid framework "${framework}". Valid options: ${VALID_FRAMEWORKS.join(', ')}`);
+  return null;
+}
 /**
  * Normalize URL for comparison and deduplication
  * @param {string} baseUrl - Base URL for resolving relative paths
@@ -140,10 +183,102 @@ function shouldExclude(href) {
   return EXCLUDE_PATTERNS.some(pattern => pattern.test(href));
 }
+/**
+ * Normalize a path (remove trailing slash except for root)
+ * @param {string} path - Path to normalize
+ * @returns {string} Normalized path
+ */
+function normalizePath(path) {
+  if (!path || typeof path !== 'string') return '/';
+  return path.endsWith('/') && path !== '/' ? path.slice(0, -1) : path;
+}
+/**
+ * Merge framework-discovered routes with link-scraped pages
+ * Prioritizes framework routes (higher quality), fills gaps with link-scraped
+ *
+ * @param {Array|null} frameworkRoutes - Routes from framework discoverer
+ * @param {Array|null} linkScrapedPages - Pages from link scraping
+ * @param {string} baseDomain - Base domain for URL normalization
+ * @param {string} baseUrl - Base URL for resolving paths
+ * @returns {Array} Merged and deduplicated pages
+ *
+ * @example
+ * const merged = mergeRoutes(
+ *   [{ path: '/about', name: 'About' }],
+ *   [{ path: '/contact', name: 'Contact' }],
+ *   'example.com',
+ *   'https://example.com'
+ * );
+ */
+function mergeRoutes(frameworkRoutes, linkScrapedPages, baseDomain, baseUrl) {
+  // Input validation
+  if (!baseDomain || typeof baseDomain !== 'string') {
+    logWarning('mergeRoutes: Invalid baseDomain');
+    baseDomain = '';
+  }
+  if (!baseUrl || typeof baseUrl !== 'string') {
+    logWarning('mergeRoutes: Invalid baseUrl');
+    baseUrl = '';
+  }
+  const seenPaths = new Set();
+  const merged = [];
+  // Add framework routes first (higher quality, more accurate)
+  if (Array.isArray(frameworkRoutes)) {
+    for (const route of frameworkRoutes) {
+      if (!route || typeof route !== 'object') continue;
+      const normalizedPath = normalizePath(route.path || '/');
+      if (seenPaths.has(normalizedPath)) continue;
+      seenPaths.add(normalizedPath);
+      const url = normalizeUrl(baseUrl, normalizedPath) || route.url || '';
+      merged.push({
+        path: normalizedPath,
+        name: route.name || extractPageName('', normalizedPath),
+        url,
+        source: route.source || 'framework',
+        dynamic: Boolean(route.dynamic)
+      });
+    }
+  }
+  // Add link-scraped pages (fill gaps)
+  if (Array.isArray(linkScrapedPages)) {
+    for (const page of linkScrapedPages) {
+      if (!page || typeof page !== 'object') continue;
+      const normalizedPath = normalizePath(page.path || '/');
+      if (seenPaths.has(normalizedPath)) continue;
+      seenPaths.add(normalizedPath);
+      merged.push({
+        path: normalizedPath,
+        name: page.name || extractPageName('', normalizedPath),
+        url: page.url || normalizeUrl(baseUrl, normalizedPath) || '',
+        source: 'link-scrape',
+        dynamic: false
+      });
+    }
+  }
+  return merged;
+}
 /**
  * Discover pages from a website by extracting navigation links
+ * Enhanced with SPA/Framework support (v1.3)
+ *
  * @param {string} baseUrl - Starting URL to discover from
  * @param {Object} options - Discovery options
+ * @param {number} [options.maxPages=10] - Maximum pages to discover
+ * @param {boolean} [options.spaMode=true] - Enable SPA detection
+ * @param {string} [options.framework] - Force specific framework
+ * @param {boolean} [options.noSpaDetect=false] - Disable SPA detection
+ * @param {boolean} [options.captureState=false] - Capture app state
  * @returns {Promise<Object>} Discovery result
  */
 export async function discoverPages(baseUrl, options = {}) {
@@ -164,7 +299,7 @@ export async function discoverPages(baseUrl, options = {}) {
     // Navigate to page
     await page.goto(baseUrl, {
-      waitUntil: ['load', 'networkidle0'],
+      waitUntil: 'networkidle',
       timeout: opts.timeout
     });
@@ -182,7 +317,62 @@ export async function discoverPages(baseUrl, options = {}) {
     // Wait a bit more for any dynamic content
     await new Promise(r => setTimeout(r, 1000));
-    // Extract links using selectors
+    // =========================================
+    // SPA/Framework Detection (v1.3)
+    // =========================================
+    let frameworkInfo = null;
+    let frameworkRoutes = [];
+    let stateSnapshot = null;
+    if (!opts.noSpaDetect) {
+      // Framework detection
+      if (opts.framework) {
+        // User forced specific framework - validate it
+        const validatedFramework = validateFramework(opts.framework);
+        if (validatedFramework) {
+          frameworkInfo = {
+            framework: validatedFramework,
+            version: null,
+            routingType: 'spa',
+            confidence: 'forced',
+            signals: ['user-specified']
+          };
+        }
+      } else {
+        // Auto-detect framework
+        try {
+          frameworkInfo = await detectFramework(page);
+        } catch (e) {
+          logWarning(`Framework detection failed: ${e.message}`);
+          frameworkInfo = null;
+        }
+      }
+      // Framework-specific route discovery
+      if (frameworkInfo?.framework && opts.spaMode) {
+        try {
+          const discoveryResult = await discoverFrameworkRoutes(page, baseUrl, frameworkInfo);
+          frameworkRoutes = discoveryResult.routes || [];
+        } catch (e) {
+          logWarning(`Route discovery failed for ${frameworkInfo.framework}: ${e.message}`);
+          frameworkRoutes = [];
+        }
+      }
+      // Capture app state (optional)
+      if (opts.captureState && frameworkInfo) {
+        try {
+          stateSnapshot = await captureAppState(page, frameworkInfo);
+        } catch (e) {
+          logWarning(`State capture failed: ${e.message}`);
+          stateSnapshot = null;
+        }
+      }
+    }
+    // =========================================
+    // Traditional Link Scraping (existing logic)
+    // =========================================
     const selectors = opts.selectors || NAV_SELECTORS;
     const selectorString = selectors.join(', ');
@@ -196,13 +386,13 @@ export async function discoverPages(baseUrl, options = {}) {
     // Process and filter links
     const seenUrls = new Set();
-    const pages = [];
+    const linkScrapedPages = [];
     // Always include homepage first
     const homeUrl = normalizeUrl(baseUrl, '/');
     if (homeUrl) {
       seenUrls.add(homeUrl);
-      pages.push({
+      linkScrapedPages.push({
         path: '/',
         name: 'Home',
         url: homeUrl
@@ -232,14 +422,31 @@ export async function discoverPages(baseUrl, options = {}) {
       // Add to results
       seenUrls.add(normalized);
-      pages.push({
+      linkScrapedPages.push({
         path,
         name: extractPageName(link.text, path),
         url: normalized
       });
       // Check max pages limit
-      if (pages.length >= opts.maxPages) break;
+      if (linkScrapedPages.length >= opts.maxPages) break;
+    }
+    // =========================================
+    // Merge Routes (v1.3)
+    // =========================================
+    let pages;
+    if (frameworkRoutes.length > 0) {
+      // Merge framework routes with link-scraped pages
+      pages = mergeRoutes(frameworkRoutes, linkScrapedPages, baseDomain, baseUrl);
+    } else {
+      // No framework routes, use link-scraped pages only
+      pages = linkScrapedPages.map(p => ({ ...p, source: 'link-scrape', dynamic: false }));
+    }
+    // Apply max pages limit to merged results
+    if (pages.length > opts.maxPages) {
+      pages = pages.slice(0, opts.maxPages);
     }
     // Sort by path depth (shallow first)
@@ -257,25 +464,47 @@ export async function discoverPages(baseUrl, options = {}) {
       success: true,
       baseUrl: baseUrlObj.origin,
       baseDomain,
+      // SPA/Framework data (v1.3)
+      framework: frameworkInfo,
+      stateSnapshot: stateSnapshot,
+      // Page discovery results
       pages,
       stats: {
         totalLinksFound: rawLinks.length,
+        frameworkRoutesFound: frameworkRoutes.length,
         pagesDiscovered: pages.length,
         durationMs: duration
       }
     };
   } catch (error) {
+    // Normalize baseUrl in error case for consistency
+    let normalizedBaseUrl = baseUrl;
+    let errorBaseDomain = '';
+    try {
+      const urlObj = new URL(baseUrl);
+      normalizedBaseUrl = urlObj.origin;
+      errorBaseDomain = urlObj.hostname;
+    } catch {
+      // Keep original baseUrl if parsing fails
+    }
     return {
       success: false,
-      baseUrl,
+      baseUrl: normalizedBaseUrl,
+      baseDomain: errorBaseDomain,
+      framework: null,
+      stateSnapshot: null,
       pages: [{
         path: '/',
         name: 'Home',
-        url: normalizeUrl(baseUrl, '/') || baseUrl
+        url: normalizeUrl(baseUrl, '/') || baseUrl,
+        source: 'fallback',
+        dynamic: false
       }],
       error: error.message,
       stats: {
         totalLinksFound: 0,
+        frameworkRoutesFound: 0,
         pagesDiscovered: 1,
         durationMs: Date.now() - startTime
       }
@@ -287,11 +516,10 @@ export async function discoverPages(baseUrl, options = {}) {
   }
 }
-// CLI support
-const isMainModule = process.argv[1] && (
-  process.argv[1].endsWith('discover-pages.js') ||
-  process.argv[1].includes('discover-pages')
-);
+// CLI support - use exact file match to avoid triggering when imported
+import { fileURLToPath } from 'url';
+const __filename = fileURLToPath(import.meta.url);
+const isMainModule = process.argv[1] === __filename;
 if (isMainModule) {
   const url = process.argv[2];