@bcility/al-performance-mcp 2.1.2 → 2.1.3
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/package.json +35 -27
- package/server.py +2131 -6
package/server.py
CHANGED
|
@@ -1,6 +1,2131 @@
|
|
|
1
|
-
|
|
2
|
-
|
|
3
|
-
b'#!/usr/bin/env python3
"""
AL Performance MCP Server
=========================
MCP server that scans AL source files for performance anti-patterns
and applies optimized fixes — based on the BC TechDays 2026 Workshop
(44 exercises covering real-world AL performance patterns).

Tools exposed:
  scan_al_workspace    — scan a folder for all performance issues
  fix_al_file          — apply all fixes to a single AL file
  fix_al_workspace     — apply all fixes to every AL file in a folder
  list_patterns        — list all known patterns with descriptions
  explain_pattern      — explain a single pattern in depth

Usage with Claude Desktop / VS Code Copilot:
  Add to mcp.json (see mcp.json in this folder)
"""

import re
import json
from pathlib import Path
from typing import Any

from mcp.server.fastmcp import FastMCP

mcp = FastMCP("AL Performance Analyzer")

# ---------------------------------------------------------------------------
# Pattern registry
# Each entry:
#   id          — short identifier used in findings
#   group       — category of issue
#   severity    — HIGH / MEDIUM / LOW
#   title       — one-line description
#   description — full explanation
#   exercises   — which workshop exercises cover this
#   detector    — callable(text) -> list[dict(line, snippet)]
#   fixer       — callable(text) -> str  (returns fixed text)
# ---------------------------------------------------------------------------

PATTERNS: list[dict] = []


def _register(id, group, severity, title, description, exercises):
    """Decorator factory that registers a pattern with its detector and fixer."""
    def decorator(cls):
        PATTERNS.append({
            "id": id,
            "group": group,
            "severity": severity,
            "title": title,
            "description": description,
            "exercises": exercises,
            "detector": cls.detect,
            "fixer": cls.fix,
        })
        return cls
    return decorator


def _find_line(text: str, char_offset: int) -> int:
    return text[:char_offset].count('\n') + 1


def _findings(text: str, pattern: re.Pattern, message_fn=None) -> list[dict]:
    out = []
    for m in pattern.finditer(text):
        line = _find_line(text, m.start())
        snippet = m.group(0).strip()[:120]
        out.append({"line": line, "snippet": snippet, "message": message_fn(m) if message_fn else ""})
    return out


# ───────────────────────────────────────────────────────────────────────
# PATTERN 01 — Missing SetLoadFields before FindSet / Find
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="MISSING_SETLOADFIELDS",
    group="Data Transfer",
    severity="HIGH",
    title="FindSet/Find without SetLoadFields",
    description=('Customer.FindSet() without SetLoadFields generates a SELECT with ALL 100+ fields — including every table extension column joined in. On each row, the NST deserialises a massive buffer it doesn\'t need.\n\nSQL IMPACT: SELECT \\"18\\".\\"timestamp\\",\\"18\\".\\"No_\\",\\"18\\".\\"Name\\"... (all 100+ columns) + JOIN extension tables.\nWith 10 000 customers that\'s gigabytes of needlessly transferred data.\n\nBAD:  if Customer.FindSet() then\nGOOD: Customer.SetLoadFields(\\"No.\\", Name, \\"Credit Limit (LCY)\\");\n      if Customer.FindSet() then\n\nHINT: Look at the SELECT in SQL Profiler. Count how many columns are fetched. Then add SetLoadFields and compare.'),
    exercises=[1, 2, 33],
)
class PatternMissingSetLoadFields:
    # Detect: FindSet/Find on a record variable NOT immediately preceded (within 3 lines) by SetLoadFields
    _FIND = re.compile(r'(\w+)\.(FindSet|FindFirst|FindLast|Find\()', re.MULTILINE)

    @staticmethod
    def detect(text: str) -> list[dict]:
        findings = []
        lines = text.splitlines()
        for i, line in enumerate(lines):
            m = re.search(r'(\w+)\.(FindSet|FindFirst|FindLast|Find\()', line)
            if not m:
                continue
            var = m.group(1)
            if var.lower() in ('true', 'false', 'result', 'rec'):
                continue
            # Check 3 lines above for SetLoadFields on same var
            context = '\n'.join(lines[max(0, i-3):i])
            if f'{var}.SetLoadFields' not in context and f'{var}.SetAutoCalcFields' not in context:
                # Exclude if in a comment
                stripped = line.strip()
                if stripped.startswith('//'):
                    continue
                findings.append({
                    "line": i + 1,
                    "snippet": line.strip()[:120],
                    "message": f"'{var}.{m.group(2)}' called without SetLoadFields"
                })
        return findings

    @staticmethod
    def fix(text: str) -> str:
        # This pattern requires context-specific fixes (which fields to load)
        # We annotate rather than blindly fix
        return text


# ───────────────────────────────────────────────────────────────────────
# PATTERN 02 — Find('-') buffer-size-1 anti-pattern
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="FIND_DASH_BUFFER_ONE",
    group="Data Transfer",
    severity="HIGH",
    title="Find('-') with buffer size 1 (use FindSet instead)",
    description=("Find('-') pre-fetches only 1 record at a time (read buffer = 1). Each call to Next() fires a new SQL query: SELECT TOP 50 ...\nFor 1 000 entries that is 20 round-trips instead of 1 with FindSet. Find('-') also ignores any previous SetCurrentKey call.\n\nSQL IMPACT: SELECT TOP 50 ... (repeated per Next() batch)\nvs FindSet: single SELECT that pre-fetches rows efficiently.\n\nBAD:  if Record.Find('-') then repeat ... until Record.Next() = 0;\nGOOD: if Record.FindSet() then repeat ... until Record.Next() = 0;\n\nHINT: Compare the number of SQL queries for Find('-') vs FindSet on 1 000 rows. Check the Reads column in Profiler."),
    exercises=[2, 24],
)
class PatternFindDash:
    _RE = re.compile(r"(\w+)\.Find\('-'\)", re.MULTILINE)

    @staticmethod
    def detect(text: str) -> list[dict]:
        return _findings(text, PatternFindDash._RE,
                         lambda m: f"Use FindSet() instead of {m.group(1)}.Find('-')")

    @staticmethod
    def fix(text: str) -> str:
        return PatternFindDash._RE.sub(lambda m: f"{m.group(1)}.FindSet()", text)


# ───────────────────────────────────────────────────────────────────────
# PATTERN 03 — CalcFields inside a loop
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="CALCFIELDS_IN_LOOP",
    group="FlowFields",
    severity="HIGH",
    title="CalcFields inside a repeat..until loop",
    description=('Calling CalcFields(Balance) inside a FindSet loop fires one extra SQL sub-query per iteration to compute the FlowField aggregate. For 500 vendors that is 500 extra SQL round-trips just for Balance. SetAutoCalcFields merges the FlowField into the main SELECT.\n\nSQL IMPACT: Per row: SELECT SUM(...) FROM \\"Detailed Vendor Ledg. Entry\\" ... = N additional queries inside the loop.\n\nBAD:  repeat Customer.CalcFields(Balance); until Customer.Next() = 0;\nGOOD: Customer.SetAutoCalcFields(Balance);\n      if Customer.FindSet() then repeat ... until Customer.Next() = 0;\n\nHINT: Count the extra SQL queries per loop iteration with CalcFields vs AutoCalcFields. Duration difference grows with record count.'),
    exercises=[3],
)
class PatternCalcFieldsInLoop:
    _RE = re.compile(r'^\s+\w+\.CalcFields\([^)]+\);', re.MULTILINE)

    @staticmethod
    def detect(text: str) -> list[dict]:
        findings = []
        lines = text.splitlines()
        in_loop = False
        depth = 0
        for i, line in enumerate(lines):
            stripped = line.strip()
            if stripped.lower() == 'repeat':
                in_loop = True
                depth += 1
            if re.match(r'until\s+\w+\.Next\(\)', stripped, re.IGNORECASE):
                depth -= 1
                if depth <= 0:
                    in_loop = False
            if in_loop and re.search(r'\w+\.CalcFields\(', line):
                if not stripped.startswith('//'):
                    findings.append({
                        "line": i + 1,
                        "snippet": line.strip()[:120],
                        "message": "CalcFields() inside loop — use SetAutoCalcFields() before FindSet()"
                    })
        return findings

    @staticmethod
    def fix(text: str) -> str:
        return text  # Context-specific; needs the variable name


# ───────────────────────────────────────────────────────────────────────
# PATTERN 04 — Record parameter passed by value (missing var)
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="RECORD_BY_VALUE",
    group="Memory / Copies",
    severity="MEDIUM",
    title="Record parameter passed by value instead of var",
    description=('Without VAR, AL copies the entire Record instance into a new memory block: all field values, filter state, cursor position. Large records (Customer, Item) copied on every call. With many nested calls this causes significant GC pressure on NST.\n\nSQL IMPACT: No SQL change — overhead is in NST memory allocation & copy.\n\nBAD:  local procedure Foo(Customer: Record Customer)\nGOOD: local procedure Foo(var Customer: Record Customer)\n\nHINT: No SQL difference — measure NST throughput and allocation counters.'),
    exercises=[4],
)
class PatternRecordByValue:
    _RE = re.compile(
        r'(local\s+procedure|procedure)\s+\w+\((?:[^)]*,\s*)?(\w+):\s*Record\s+[^;)]+\)',
        re.MULTILINE
    )

    @staticmethod
    def detect(text: str) -> list[dict]:
        findings = []
        for m in PatternRecordByValue._RE.finditer(text):
            line_text = text[max(0, m.start()-200):m.end()]
            if '(var ' in m.group(0) or re.search(r'\bvar\s+\w+:\s*Record', m.group(0)):
                continue
            if m.group(2) == 'var':
                continue
            line = _find_line(text, m.start())
            findings.append({
                "line": line,
                "snippet": m.group(0)[:120],
                "message": "Record parameter without 'var' — creates a full copy on each call"
            })
        return findings

    @staticmethod
    def fix(text: str) -> str:
        return text


# ───────────────────────────────────────────────────────────────────────
# PATTERN 05 — Loop sum instead of CalcSums
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="LOOP_SUM_VS_CALCSUMS",
    group="Aggregation",
    severity="HIGH",
    title="Manual summation loop instead of CalcSums",
    description=('Summing a field by iterating all rows in AL: fetches every row from SQL, deserialises it in NST, accumulates in a local variable. CalcSums(Amount) translates to a SQL SUM() aggregate — computed at the database, returns a single row.\n\nSQL IMPACT: Manual loop: SELECT all rows, process N rows in NST\nCalcSums:    SELECT SUM(\\"Amount\\") ... — returns 1 row.\n\nBAD:  repeat Total += Record.Amount; until Record.Next() = 0;\nGOOD: Record.CalcSums(Amount); Total := Record.Amount;\n\nHINT: CalcSums result: 1 SQL row returned. Loop result: N SQL rows fetched and summed. Check Reads: CalcSums = 1, loop = N.'),
    exercises=[5],
)
class PatternLoopSum:
    _RE = re.compile(r'(\w+)\s*\+=\s*\w+\.\w+;', re.MULTILINE)

    @staticmethod
    def detect(text: str) -> list[dict]:
        findings = []
        lines = text.splitlines()
        in_loop = False
        for i, line in enumerate(lines):
            stripped = line.strip()
            if stripped.lower() == 'repeat':
                in_loop = True
            if re.match(r'until\s+\w+\.Next\(\)', stripped, re.IGNORECASE):
                in_loop = False
            if in_loop and PatternLoopSum._RE.search(line) and not stripped.startswith('//'):
                findings.append({
                    "line": i + 1,
                    "snippet": line.strip()[:120],
                    "message": "Manual += accumulation in loop — consider CalcSums() if summing a single field"
                })
        return findings

    @staticmethod
    def fix(text: str) -> str:
        return text


# ───────────────────────────────────────────────────────────────────────
# PATTERN 06 — String concatenation += in loop (use TextBuilder)
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="STRING_CONCAT_IN_LOOP",
    group="Memory / Copies",
    severity="HIGH",
    title="Text += string concatenation in loop (O(n²)) — use TextBuilder",
    description=("AL's Text type is a value type. Each += creates a brand-new string object in NST memory — old strings become GC garbage immediately. For N iterations: O(N²) memory allocations and copies. TextBuilder wraps .NET StringBuilder: O(N) time, no intermediate copies.\n\nSQL IMPACT: No SQL impact — pure NST memory pressure & GC overhead.\n\nBAD:  CsvContent += BuildDetailLine(...);\nGOOD: var Builder: TextBuilder;\n      Builder.Append(BuildDetailLine(...));\n      Result := Builder.ToText(); // Single allocation at end\n\nHINT: The GC pressure is invisible in SQL Profiler but shows up in NST memory counters."),
    exercises=[6],
)
class PatternStringConcatInLoop:
    _RE = re.compile(r'(\w+)\s*\+=\s*(?![\d.])', re.MULTILINE)

    @staticmethod
    def detect(text: str) -> list[dict]:
        findings = []
        lines = text.splitlines()
        in_loop = False
        for i, line in enumerate(lines):
            stripped = line.strip()
            if stripped.lower() == 'repeat' or re.search(r'\bforeach\b', stripped, re.IGNORECASE):
                in_loop = True
            if re.match(r'until\s+\w+\.Next\(\)', stripped, re.IGNORECASE) or stripped == 'end;':
                in_loop = False
            if in_loop:
                m = PatternStringConcatInLoop._RE.search(line)
                if m and not stripped.startswith('//'):
                    var = m.group(1)
                    # Look back to see if it's declared as Text
                    context = '\n'.join(lines[max(0, i-30):i])
                    if re.search(rf'\b{re.escape(var)}\s*:\s*Text\b', context):
                        findings.append({
                            "line": i + 1,
                            "snippet": line.strip()[:120],
                            "message": f"Text += in loop creates O(n²) allocations — use TextBuilder"
                        })
        return findings

    @staticmethod
    def fix(text: str) -> str:
        return text


# ───────────────────────────────────────────────────────────────────────
# PATTERN 07 — FindSet without (true) when modifying via cursor
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="FINDSET_MODIFY_NO_TRUE",
    group="Locking",
    severity="MEDIUM",
    title="FindSet() without (true) when Modify is called on cursor variable",
    description=('FindSet uses ReadUncommitted isolation and pre-fetches rows in batches. Calling Modify inside the loop body can invalidate the cursor position. Records may be visited twice, skipped entirely, or cause deadlocks. The cursor is not designed to survive concurrent DML on the same rows.\n\nSQL IMPACT: SELECT TOP 50 ... (ReadUncommitted) then UPDATE inside — cursor instability.\n\nBAD:  if Record.FindSet() then repeat Record.Field := ...; Record.Modify(); ...\nGOOD: if Record.FindSet(true) then repeat Record.Field := ...; Record.Modify(); ...\n\nHINT: Use SQL Profiler to watch which records get updated. Run the anti-pattern twice — some records may be updated twice or skipped.'),
    exercises=[7],
)
class PatternFindSetNoForUpdate:
    _RE = re.compile(r'(\w+)\.FindSet\(\)', re.MULTILINE)

    @staticmethod
    def detect(text: str) -> list[dict]:
        findings = []
        lines = text.splitlines()
        for i, line in enumerate(lines):
            m = PatternFindSetNoForUpdate._RE.search(line)
            if not m or line.strip().startswith('//'):
                continue
            var = m.group(1)
            # Look ahead for Modify on the same var
            ahead = '\n'.join(lines[i:min(len(lines), i+15)])
            if re.search(rf'\b{re.escape(var)}\.Modify\(', ahead):
                findings.append({
                    "line": i + 1,
                    "snippet": line.strip()[:120],
                    "message": f"'{var}.FindSet()' but '{var}.Modify()' found in loop — use FindSet(true)"
                })
        return findings

    @staticmethod
    def fix(text: str) -> str:
        # Only fix when Modify follows in same loop — conservative approach
        def replace_if_modify_follows(m):
            pos = m.end()
            ahead = text[pos:pos+500]
            var = m.group(1)
            if re.search(rf'\b{re.escape(var)}\.Modify\(', ahead):
                return f"{var}.FindSet(true)"
            return m.group(0)
        return re.sub(r'(\w+)\.FindSet\(\)', replace_if_modify_follows, text)


# ───────────────────────────────────────────────────────────────────────
# PATTERN 08 — Delete inside a loop (use DeleteAll)
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="DELETE_IN_LOOP",
    group="Bulk Operations",
    severity="HIGH",
    title="Record.Delete() inside a loop — use DeleteAll()",
    description=('Same cursor instability as Modify — Delete during FindSet can cause the read cursor to skip or revisit records. DeleteAll is atomic and uses a single DELETE FROM statement. If selective deletion is needed, collect keys first, delete after loop.\n\nSQL IMPACT: SELECT TOP 50 (cursor) + DELETE per row — cursor corruption risk.\nDeleteAll: 1 DELETE FROM statement vs N individual DELETEs.\n\nBAD:  if Record.FindSet() then repeat Record.Delete(); until Record.Next() = 0;\nGOOD: Record.SetRange(Active, false); Record.DeleteAll(false);\n\nHINT: Compare the number of DELETE statements in Profiler: DeleteAll = 1 SQL DELETE; loop = N DELETEs.'),
    exercises=[8],
)
class PatternDeleteInLoop:
    @staticmethod
    def detect(text: str) -> list[dict]:
        findings = []
        lines = text.splitlines()
        in_loop = False
        loop_var = None
        for i, line in enumerate(lines):
            stripped = line.strip()
            m = re.search(r'(\w+)\.FindSet', line)
            if m and not stripped.startswith('//'):
                in_loop = True
                loop_var = m.group(1)
            if in_loop and loop_var and re.search(rf'\b{re.escape(loop_var)}\.Delete\(', line):
                if not stripped.startswith('//'):
                    findings.append({
                        "line": i + 1,
                        "snippet": line.strip()[:120],
                        "message": f"'{loop_var}.Delete()' inside FindSet loop — use '{loop_var}.DeleteAll(false)'"
                    })
            if re.match(r'until\s+\w+\.Next\(\)', stripped, re.IGNORECASE):
                in_loop = False
                loop_var = None
        return findings

    @staticmethod
    def fix(text: str) -> str:
        return text


# ───────────────────────────────────────────────────────────────────────
# PATTERN 09 — Count() <> 0 instead of not IsEmpty()
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="COUNT_NOT_ZERO",
    group="Existence Checks",
    severity="MEDIUM",
    title="Count() <> 0 / Count() > 0 — use IsEmpty() instead",
    description=('Count() generates SELECT COUNT(*) — the database must count ALL matching rows before returning. On large tables this is expensive. IsEmpty() generates IF EXISTS (SELECT TOP 1 NULL ...) — stops at the first match. O(1) vs O(N).\n\nSQL IMPACT: Count():   SELECT COUNT(*) FROM ... → scans entire table\nIsEmpty(): IF EXISTS (SELECT TOP 1 NULL FROM ...) → stops immediately.\n\nBAD:  exit(Record.Count() <> 0);\nGOOD: exit(not Record.IsEmpty());\n\nHINT: Compare SQL Profiler output for both. Count() always reads all rows first. IsEmpty stops at the very first match.'),
    exercises=[9, 10, 11],
)
class PatternCountNotZero:
    _RE = re.compile(r'(\w+)\.Count\(\)\s*(?:<>|>|=)\s*0', re.MULTILINE)

    @staticmethod
    def detect(text: str) -> list[dict]:
        return _findings(text, PatternCountNotZero._RE,
                         lambda m: f"'{m.group(1)}.Count() != 0' — use IsEmpty() for O(1) existence check")

    @staticmethod
    def fix(text: str) -> str:
        def replace(m):
            var = m.group(1)
            op = m.group(0).split('Count()')[1].strip().split(' ')[0]
            if op in ('<>', '>'):
                return f'not {var}.IsEmpty()'
            if op == '=':
                return f'{var}.IsEmpty()'
            return m.group(0)
        return PatternCountNotZero._RE.sub(replace, text)


# ───────────────────────────────────────────────────────────────────────
# PATTERN 10 — Redundant IsEmpty before FindSet (double scan)
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="ISEMPTY_BEFORE_FINDSET",
    group="Existence Checks",
    severity="MEDIUM",
    title="Redundant IsEmpty() before FindSet() (two SQL scans instead of one)",
    description=('Checking IsEmpty() immediately before FindSet fires TWO SQL queries: 1) IF EXISTS (SELECT TOP 1 NULL ...) — the IsEmpty check; 2) SELECT TOP 50 ... — the FindSet. FindSet already returns false when no rows match — the IsEmpty is waste.\n\nSQL IMPACT: Query 1: IF EXISTS (SELECT TOP 1 NULL ...). Query 2: SELECT TOP 50 ... → redundant.\n\nBAD:  if not Record.IsEmpty() then\n          if Record.FindSet() then ...\nGOOD: if Record.FindSet() then ...\n\nHINT: Count the SQL queries in Profiler: IsEmpty + FindSet = 2; just FindSet = 1. The IsEmpty result is ignored by FindSet anyway.'),
    exercises=[11],
)
class PatternIsEmptyBeforeFindSet:
    @staticmethod
    def detect(text: str) -> list[dict]:
        findings = []
        lines = text.splitlines()
        for i, line in enumerate(lines):
            if re.search(r'not\s+\w+\.IsEmpty\(\)', line) and not line.strip().startswith('//'):
                # Check next 2 lines for FindSet
                ahead = '\n'.join(lines[i:min(len(lines), i+3)])
                if re.search(r'\.FindSet\(', ahead):
                    findings.append({
                        "line": i + 1,
                        "snippet": line.strip()[:120],
                        "message": "Redundant IsEmpty() guard before FindSet() — FindSet() returns false when empty"
                    })
        return findings

    @staticmethod
    def fix(text: str) -> str:
        return re.sub(
            r'[ \t]+if not (\w+)\.IsEmpty\(\) then\s*\n([ \t]+)if \1\.FindSet\(',
            r'\2if \1.FindSet(',
            text
        )


# ───────────────────────────────────────────────────────────────────────
# PATTERN 11 — Missing 'temporary' keyword on temp table variable
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="MISSING_TEMPORARY",
    group="Memory / Copies",
    severity="HIGH",
    title="Temp table variable missing 'temporary' keyword",
    description=('A non-temporary record sends every Insert/Get/Delete to SQL Server. Using a regular table as an in-memory scratchpad causes unnecessary SQL round-trips, transaction log writes, and lock contention. Declaring the variable \'temporary\' keeps all operations in NST memory.\n\nSQL IMPACT: Without temporary: INSERT INTO / SELECT / DELETE — full SQL for each op.\nWith temporary: All operations in NST memory — zero SQL round-trips.\n\nBAD:  TempData: Record \\"Workshop Data\\";\nGOOD: TempData: Record \\"Workshop Data\\" temporary;\n\nHINT: Insert 1 000 rows with and without \'temporary\'. Without: watch 1 000 INSERTs in SQL Profiler. With temporary: zero SQL activity.'),
    exercises=[12],
)
class PatternMissingTemporary:
    @staticmethod
    def detect(text: str) -> list[dict]:
        findings = []
        lines = text.splitlines()
        for i, line in enumerate(lines):
            # Variable declared with Temp prefix but no 'temporary' keyword
            if re.search(r'\bTemp\w+\s*:\s*Record\s+', line) and 'temporary' not in line and not line.strip().startswith('//'):
                findings.append({
                    "line": i + 1,
                    "snippet": line.strip()[:120],
                    "message": "Variable with 'Temp' prefix is missing 'temporary' keyword"
                })
        return findings

    @staticmethod
    def fix(text: str) -> str:
        return re.sub(
            r'(Temp\w+\s*:\s*Record\s+[^;]+);(?!\s*//.*temporary)',
            lambda m: m.group(0).rstrip(';') + ' temporary;' if 'temporary' not in m.group(0) else m.group(0),
            text
        )


# ───────────────────────────────────────────────────────────────────────
# PATTERN 12 — Temp table used as Dictionary (use Dictionary type)
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="TEMP_TABLE_AS_DICT",
    group="Memory / Copies",
    severity="MEDIUM",
    title="Temp Record table used as a key-value lookup (use Dictionary instead)",
    description=("Even a 'temporary' table carries record-layer overhead: key indexes, transaction state tracking, schema validation on every operation. For simple key→value mapping (e.g. CustomerNo → SalespersonCode), the built-in Dictionary of [K, V] type has zero DB overhead.\n\nSQL IMPACT: Temp table: key index maintenance, record struct overhead per entry.\nDictionary: direct hash map lookup — O(1) Get/Set, no record overhead.\n\nBAD:  TempCustomer: Record Customer temporary; TempCustomer.Insert(); TempCustomer.Get(...);\nGOOD: RoutingMap: Dictionary of [Code[20], Code[20]];\n      RoutingMap.Set(..., ...); if RoutingMap.ContainsKey(...) then ...\n\nHINT: Compare Get/Set operations on temp table vs Dictionary. Measure time for 10 000 lookups each way."),
    exercises=[13],
)
class PatternTempTableAsDict:
    @staticmethod
    def detect(text: str) -> list[dict]:
        findings = []
        lines = text.splitlines()
        for i, line in enumerate(lines):
            m = re.search(r'(Temp\w+)\s*:\s*Record\s+\S+\s+temporary', line)
            if not m:
                continue
            var = m.group(1)
            # Look ahead for both Insert and Get on same var — classic dict pattern
            rest = '\n'.join(lines[i:min(len(lines), i+60)])
            if re.search(rf'\b{re.escape(var)}\.Insert\(', rest) and re.search(rf'\b{re.escape(var)}\.Get\(', rest):
                findings.append({
                    "line": i + 1,
                    "snippet": line.strip()[:120],
                    "message": f"'{var}' used as key-value store (Insert+Get pattern) — prefer Dictionary of [...]"
                })
        return findings

    @staticmethod
    def fix(text: str) -> str:
        return text


# ───────────────────────────────────────────────────────────────────────
# PATTERN 13 — FindFirst() used for loop iteration
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="FINDFIRST_IN_LOOP",
    group="Data Transfer",
    severity="HIGH",
    title="FindFirst() used for multi-row iteration (buffer size 1)",
    description=('FindFirst() generates SELECT TOP 1 — fetches exactly one record. When used to start a loop (calling Next() repeatedly), every Next() call that exhausts the buffer fires a new SELECT TOP 50. FindSet() pre-fetches 50 rows immediately — far fewer SQL queries.\n\nSQL IMPACT: FindFirst: SELECT TOP 1 ... then SELECT TOP 50 per batch in Next().\nFindSet:   Single SELECT that establishes the full read cursor.\n\nBAD:  if Record.FindFirst() then repeat ... until Record.Next() = 0;\nGOOD: if Record.FindSet() then repeat ... until Record.Next() = 0;\n\nHINT: Trace SQL queries for a 500-row loop with FindFirst. FindFirst fires SELECT TOP 1 first, then Next batches. FindSet fires one SELECT and handles batching internally.'),
    exercises=[14],
)
class PatternFindFirstInLoop:
    @staticmethod
    def detect(text: str) -> list[dict]:
        findings = []
        lines = text.splitlines()
        for i, line in enumerate(lines):
            m = re.search(r'(\w+)\.FindFirst\(\)', line)
            if not m or line.strip().startswith('//'):
                continue
            var = m.group(1)
            # Look ahead for Next() on same var
            ahead = '\n'.join(lines[i:min(len(lines), i+20)])
            if re.search(rf'\b{re.escape(var)}\.Next\(\)', ahead):
                findings.append({
                    "line": i + 1,
                    "snippet": line.strip()[:120],
                    "message": f"'{var}.FindFirst()' followed by Next() — use FindSet() for multi-row iteration"
                })
        return findings

    @staticmethod
    def fix(text: str) -> str:
        def replace(m):
            var = m.group(1)
            pos = m.end()
            ahead = text[pos:pos+300]
            if re.search(rf'\b{re.escape(var)}\.Next\(\)', ahead):
                return f"{var}.FindSet()"
            return m.group(0)
        return re.sub(r'(\w+)\.FindFirst\(\)', replace, text)


# ───────────────────────────────────────────────────────────────────────
# PATTERN 14 — FindSet guard before ModifyAll (unnecessary)
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="FINDSET_BEFORE_MODIFYALL",
    group="Bulk Operations",
    severity="MEDIUM",
    title="FindSet() guard before ModifyAll() — unnecessary (double scan)",
    description=('Calling FindSet() immediately before ModifyAll() fires an extra SELECT just to confirm rows exist. ModifyAll() already handles empty result sets gracefully — it does nothing if no rows match the current filters. The FindSet is pure overhead with zero functional benefit.\n\nSQL IMPACT: Extra query: SELECT TOP 50 ... (only to check existence).\nThen: UPDATE ... WHERE ... (ModifyAll — does this anyway).\nWith FindSet: 2 queries (SELECT + UPDATE). Without: 1 query (UPDATE only).\n\nBAD:  if Record.FindSet() then Record.ModifyAll(...);\nGOOD: Record.ModifyAll(...);\n\nHINT: Look at SQL before ModifyAll with and without FindSet. With FindSet: 2 queries. Without: 1 query.'),
    exercises=[15],
)
class PatternFindSetBeforeModifyAll:
    _RE = re.compile(r'if\s+(\w+)\.FindSet\(\)\s+then\s+\n?\s+\1\.ModifyAll\(', re.MULTILINE)

    @staticmethod
    def detect(text: str) -> list[dict]:
        return _findings(text, PatternFindSetBeforeModifyAll._RE,
                         lambda m: f"FindSet() guard before ModifyAll() on '{m.group(1)}' is redundant")

    @staticmethod
    def fix(text: str) -> str:
        return re.sub(
            r'if\s+(\w+)\.FindSet\(\)\s+then\s*\n(\s+)\1\.ModifyAll\(',
            r'\2\1.ModifyAll(',
            text
        )


# ───────────────────────────────────────────────────────────────────────
# PATTERN 15 — SetFilter on FlowField (use SetAutoCalcFields + AL filter)
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="SETFILTER_ON_FLOWFIELD",
    group="FlowFields",
    severity="HIGH",
    title="SetFilter on FlowField causes correlated subquery per row",
    description=("SetFilter on a FlowField (e.g. Balance, which is a CalcField) cannot be pushed to the SQL WHERE clause — it has no physical column. BC must fetch ALL rows matching the other filters, then compute the FlowField for each row individually and filter in AL. Full table scan.\n\nSQL IMPACT: SELECT all rows ... then per row: SELECT SUM(...) for FlowField.\nSQL cannot filter on a computed value it hasn't calculated yet.\n\nBAD:  Customer.SetFilter(Balance, '>%1', 0); if Customer.FindSet() then ...\nGOOD: Customer.SetAutoCalcFields(Balance);\n      if Customer.FindSet() then repeat if Customer.Balance > 0 then ...\n\nHINT: Try SetFilter(Balance, '>1000') — check the SQL WHERE. Balance won't appear in WHERE — all rows fetched. Compare with filtering on a normal indexed decimal field."),
    exercises=[16],
)
class PatternSetFilterOnFlowField:
    # Common FlowFields in BC
    _FLOWFIELDS = {'Balance', 'Balance (LCY)', 'Sales (LCY)', 'Purchases (LCY)',
                   'Outstanding Orders', 'Outstanding Invoices', 'Net Change'}
    _RE = re.compile(r'(\w+)\.SetFilter\(([^,)]+),', re.MULTILINE)

    @staticmethod
    def detect(text: str) -> list[dict]:
        findings = []
        for m in PatternSetFilterOnFlowField._RE.finditer(text):
            field = m.group(2).strip().strip('"')
            if field in PatternSetFilterOnFlowField._FLOWFIELDS:
                line = _find_line(text, m.start())
                findings.append({
                    "line": line,
                    "snippet": m.group(0)[:120],
                    "message": f"SetFilter on FlowField '{field}' — use SetAutoCalcFields + AL-side filter"
                })
        return findings

    @staticmethod
    def fix(text: str) -> str:
        return text


# ───────────────────────────────────────────────────────────────────────
# PATTERN 16 — OR / AND both sides always evaluated (use nested IF)
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="EAGER_EVALUATION_OR_AND",
    group="Short-Circuit Evaluation",
    severity="MEDIUM",
    title="AL 'or'/'and' evaluates both sides eagerly — use nested IF for expensive calls",
    description=('AL evaluates BOTH sides of OR/AND regardless of the left side result. If the left condition calls an expensive function (FindSet, CalcFields), the right side still runs even when left already determines the result. Nested IF statements provide proper short-circuit behavior.\n\nSQL IMPACT: No SQL change — both function calls execute unconditionally.\nWith nested IF: expensive right-side call skipped when left is true/false.\n\nBAD:  if ExpensiveA() or ExpensiveB() then\nGOOD: if ExpensiveA() then ProcessResult()\n      else if ExpensiveB() then ProcessResult();\n\nHINT: Add trace messages inside each expensive function. Count how many times each is called with OR vs nested IF. Right-side function should not run when left is true.'),
    exercises=[17, 18, 39],
)
class PatternEagerEvaluation:
    # Heuristic: function calls as operands of or/and
    _RE = re.compile(r'\b(\w+\([^)]*\))\s+(or|and)\s+(\w+\([^)]*\))', re.MULTILINE | re.IGNORECASE)

    @staticmethod
    def detect(text: str) -> list[dict]:
        findings = []
        for m in PatternEagerEvaluation._RE.finditer(text):
            if text[max(0, m.start()-2):m.start()].strip().startswith('//'):
                continue
            line = _find_line(text, m.start())
            line_text = text.splitlines()[line-1].strip()
            if line_text.startswith('//'):
                continue
            findings.append({
                "line": line,
                "snippet": m.group(0)[:120],
                "message": f"Eager evaluation: '{m.group(2).upper()}' always evaluates both sides — use nested IF or 'case true of'"
            })
        return findings

    @staticmethod
    def fix(text: str) -> str:
        return text  # Requires understanding of intent


# ───────────────────────────────────────────────────────────────────────
# PATTERN 17 — SetRange/filter mutation inside FindSet loop
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="FILTER_MUTATION_IN_LOOP",
    group="Cursor Safety",
    severity="HIGH",
    title="SetRange/SetFilter inside FindSet loop corrupts cursor",
    description=("Setting a new filter inside a FindSet loop modifies the record variable's filter state. Next() continues on the OLD cursor, not the new filter. Result: records may be missed, wrong data returned, or infinite loop. The cursor position becomes undefined after a SetRange mid-loop.\n\nSQL IMPACT: Cursor established by FindSet, then filter changed → Next() undefined behavior. Hard to reproduce bugs.\n\nBAD:  if Rec.FindSet() then repeat Rec.SetRange(Field, Rec.Field); until Rec.Next()=0;\nGOOD: Collect keys into a List first, then process with Get().\n\nHINT: Set a breakpoint inside the loop after SetRange. Watch which records Next() returns after the filter change."),
    exercises=[19],
)
class PatternFilterMutationInLoop:
    @staticmethod
    def detect(text: str) -> list[dict]:
        findings = []
        lines = text.splitlines()
        in_loop = False
        loop_var = None
        for i, line in enumerate(lines):
            m = re.search(r'(\w+)\.FindSet', line)
            if m and not line.strip().startswith('//'):
                in_loop = True
                loop_var = m.group(1)
            if in_loop and loop_var:
                if re.search(rf'\b{re.escape(loop_var)}\.(SetRange|SetFilter)\(', line) and not line.strip().startswith('//'):
                    findings.append({
                        "line": i + 1,
                        "snippet": line.strip()[:120],
                        "message": f"'{loop_var}.SetRange/SetFilter' inside FindSet loop — corrupts cursor"
                    })
            if re.match(r'until\s+\w+\.Next\(\)', line.strip(), re.IGNORECASE):
                in_loop = False
                loop_var = None
        return findings

    @staticmethod
    def fix(text: str) -> str:
        return text


# ───────────────────────────────────────────────────────────────────────
# PATTERN 18 — FindSet before DeleteAll (unnecessary guard)
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="FINDSET_BEFORE_DELETEALL",
    group="Bulk Operations",
    severity="MEDIUM",
    title="FindSet() guard before DeleteAll() is redundant",
    description=('Same anti-pattern as FindSet before ModifyAll — calling FindSet() before DeleteAll() fires an extra SELECT just to verify rows exist. DeleteAll() already handles empty result sets — it does nothing.\n\nSQL IMPACT: Extra query: SELECT TOP 50 ... (only to check existence).\nThen: DELETE FROM ... WHERE ... (DeleteAll — does this anyway).\nFindSet before DeleteAll = 2 SQL queries. Just DeleteAll = 1 SQL DELETE statement.\n\nBAD:  if Record.FindSet() then Record.DeleteAll();\nGOOD: Record.DeleteAll();\n\nHINT: Same as FindSet before ModifyAll but for DeleteAll. With FindSet: 2 queries. Without: 1 DELETE statement.'),
    exercises=[20],
)
class PatternFindSetBeforeDeleteAll:
    _RE = re.compile(r'if\s+(\w+)\.FindSet\(\)\s+then\s*\n?\s*\1\.DeleteAll\(', re.MULTILINE)

    @staticmethod
    def detect(text: str) -> list[dict]:
        return _findings(text, PatternFindSetBeforeDeleteAll._RE,
                         lambda m: f"FindSet() guard before DeleteAll() on '{m.group(1)}' is redundant")

    @staticmethod
    def fix(text: str) -> str:
        return re.sub(
            r'if\s+(\w+)\.FindSet\(\)\s+then\s*\n(\s+)\1\.DeleteAll\(',
            r'\2\1.DeleteAll(',
            text
        )


# ───────────────────────────────────────────────────────────────────────
# PATTERN 19 — DeleteAll without IsEmpty guard on lock-sensitive records
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="DELETEALL_NO_ISEMPTY_GUARD",
    group="Locking",
    severity="LOW",
    title="DeleteAll() without IsEmpty guard acquires write lock even when empty",
    description=('DeleteAll() on an empty (or likely-empty) table still fires a DELETE FROM ... SQL statement — acquiring a write lock even if there are zero rows to delete. Under high concurrency, unnecessary lock acquisition causes contention.\n\nSQL IMPACT: DELETE FROM ... WHERE ... → acquires write lock even if 0 rows affected.\nIsEmpty guard: IF EXISTS check first → skip DELETE if empty.\n\nCONSIDER: if not Record.IsEmpty() then Record.DeleteAll(false);\n\nHINT: Call DeleteAll on an empty table in SQL Profiler. Without guard: DELETE fires even with 0 rows. With IsEmpty guard: DELETE skipped entirely.'),
    exercises=[21],
)
class PatternDeleteAllNoGuard:
    @staticmethod
    def detect(text: str) -> list[dict]:
        findings = []
        lines = text.splitlines()
        for i, line in enumerate(lines):
            m = re.search(r'(\w+)\.DeleteAll\(', line)
            if not m or line.strip().startswith('//'):
                continue
            var = m.group(1)
            # Check 2 lines above for IsEmpty guard on same var
            context = '\n'.join(lines[max(0, i-2):i])
            if f'{var}.IsEmpty' not in context:
                findings.append({
                    "line": i + 1,
                    "snippet": line.strip()[:120],
                    "message": f"Consider 'if not {var}.IsEmpty() then' guard before DeleteAll() to avoid locking on empty sets"
                })
        return findings

    @staticmethod
    def fix(text: str) -> str:
        return text


# ───────────────────────────────────────────────────────────────────────
# PATTERN 20 — Count() = 1 "exactly one" check (use FindFirst + Next)
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="COUNT_EQUALS_ONE",
    group="Existence Checks",
    severity="MEDIUM",
    title="Count() = 1 to check uniqueness scans entire set",
    description=("Count() = 1 requires the database to count ALL matching rows. To check 'exactly one record exists', you only need to fetch two rows: FindFirst() gets the first, Next() = 0 confirms there is no second. Maximum 2 row reads.\n\nSQL IMPACT: Count() = 1: SELECT COUNT(*) FROM ... → full table scan.\nFindFirst + Next: SELECT TOP 1 then SELECT TOP 1 → max 2 rows read.\n\nBAD:  exit(Record.Count() = 1);\nGOOD: if Record.FindFirst() then exit(Record.Next() = 0)\n      else exit(false);\n\nHINT: Compare SQL for Count()=1 vs FindFirst+Next approach. Count() reads entire matching set. FindFirst+Next reads at most 2 rows."),
    exercises=[22],
)
class PatternCountEqualsOne:
    _RE = re.compile(r'(\w+)\.Count\(\)\s*=\s*1', re.MULTILINE)

    @staticmethod
    def detect(text: str) -> list[dict]:
        return _findings(text, PatternCountEqualsOne._RE,
                         lambda m: f"Count() = 1 scans entire set — use FindFirst() + Next() = 0")

    @staticmethod
    def fix(text: str) -> str:
        def replace(m):
            var = m.group(1)
            # Look at context to see if it's in an exit()
            return f'{var}.FindFirst() and ({var}.Next() = 0)'
        return PatternCountEqualsOne._RE.sub(replace, text)


# ───────────────────────────────────────────────────────────────────────
# PATTERN 21 — Insert-on-conflict pattern (try Insert first, Modify on fail)
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="INSERT_ON_CONFLICT",
    group="Write Patterns",
    severity="MEDIUM",
    title="Insert-on-conflict anti-pattern (try Insert, Modify on fail)",
    description=('The Insert always fires. On duplicate key, SQL raises a constraint error that is caught and triggers a Modify. Error handling in SQL is extremely expensive — each conflict = a rolled-back statement + error event.\n\nSQL IMPACT: On conflict: INSERT (fails) → SQL error → error handling → UPDATE.\nWith Get: SELECT (1 row) → branch → INSERT or UPDATE (no errors).\n\nBAD:  if not Record.Insert(false) then Record.Modify(false);\nGOOD: if Record.Get(KeyValue) then Record.Modify(false)\n      else begin Record.Init(); Record.Insert(false); end;\n\nHINT: On conflict: INSERT path fires a SQL error event — visible in Profiler. Get+branch: no error events.'),
    exercises=[23],
)
class PatternInsertOnConflict:
    _RE = re.compile(r'if not \w+\.Insert\((?:false|true)?\) then\s+\w+\.Modify\(', re.MULTILINE)

    @staticmethod
    def detect(text: str) -> list[dict]:
        return _findings(text, PatternInsertOnConflict._RE,
                         lambda m: "Insert-on-fail pattern — use Get() then Modify/Insert for clarity and efficiency")

    @staticmethod
    def fix(text: str) -> str:
        return text


# ───────────────────────────────────────────────────────────────────────
# PATTERN 22 — SetCurrentKey missing for sorted iteration
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="MISSING_SETCURRENTKEY",
    group="Sort / Keys",
    severity="MEDIUM",
    title="Find('-') or FindSet without SetCurrentKey when order matters",
    description=('Find(\'-\') always reads in PRIMARY KEY ascending order, regardless of any SetCurrentKey call made before it. To read data in a specific sort order, use FindSet() after SetCurrentKey and (for descending) SetAscending(false).\n\nSQL IMPACT: Find(\'-\'): always ORDER BY primary key ASC — SetCurrentKey ignored.\nFindSet with SetAscending: ORDER BY <key> DESC — correct ordering.\n\nBAD:  Record.SetCurrentKey(\\"Posting Date\\"); if Record.Find(\'-\') then ...\nGOOD: Record.SetCurrentKey(\\"Posting Date\\");\n      Record.SetAscending(\\"Posting Date\\", false);\n      if Record.FindSet() then ...\n\nHINT: Check ORDER BY in SQL after Find(\'-\') with SetCurrentKey. SetCurrentKey is ignored — ORDER BY uses primary key.'),
    exercises=[24],
)
class PatternMissingSetCurrentKey:
    @staticmethod
    def detect(text: str) -> list[dict]:
        return []  # Covered by FIND_DASH_BUFFER_ONE; too context-specific to detect generically

    @staticmethod
    def fix(text: str) -> str:
        return text


# ───────────────────────────────────────────────────────────────────────
# PATTERN 23 — Temp table as collection (use List/Dictionary)
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="TEMP_TABLE_AS_COLLECTION",
    group="Memory / Copies",
    severity="MEDIUM",
    title="Temporary table used purely as a collection (use List or Dictionary)",
    description=('Using a temporary table purely to collect distinct scalar values (dates, IDs, codes) carries full record-layer overhead: schema validation, key index maintenance, Init/Insert/FindSet calls. List of [T] is a native AL type with zero record overhead.\n\nSQL IMPACT: Temp table Insert/FindSet: record struct overhead per value.\nList of [Date]: direct array access, no schema, no key lookup.\n\nBAD:  TempDates: Record \\"Workshop Data\\" temporary; TempDates.\\"Posting Date\\" := ...; TempDates.Insert();\nGOOD: Dates: List of [Date]; if not Dates.Contains(PostingDate) then Dates.Add(PostingDate);\n\nHINT: Compare temp table Insert/FindSet vs List.Add/iteration. Temp table: schema overhead even in memory. List: pure NST memory array.'),
    exercises=[25],
)
class PatternTempTableAsCollection:
    @staticmethod
    def detect(text: str) -> list[dict]:
        findings = []
        lines = text.splitlines()
        for i, line in enumerate(lines):
            m = re.search(r'(Temp\w+)\s*:\s*Record\s+\S+\s+temporary', line)
            if not m:
                continue
            var = m.group(1)
            rest = '\n'.join(lines[i:min(len(lines), i+80)])
            # Pure collection: Insert without reading back meaningful fields
            has_insert = bool(re.search(rf'\b{re.escape(var)}\.Insert\(', rest))
            has_get = bool(re.search(rf'\b{re.escape(var)}\.Get\(', rest))
            has_setrange = bool(re.search(rf'\b{re.escape(var)}\.SetRange\(', rest))
            if has_insert and has_setrange and not has_get:
                findings.append({
                    "line": i + 1,
                    "snippet": line.strip()[:120],
                    "message": f"'{var}' used as collection (Insert+SetRange, no Get) — use List of [...] instead"
                })
        return findings

    @staticmethod
    def fix(text: str) -> str:
        return text


# ───────────────────────────────────────────────────────────────────────
# PATTERN 24 — FindLast / FindFirst inside a loop
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="FINDLAST_IN_LOOP",
    group="Data Transfer",
    severity="HIGH",
    title="FindLast()/FindFirst() inside a loop (call once before the loop)",
    description=('Calling FindLast() inside a loop to determine the next Entry No. fires SELECT MAX(\\"Entry No_\\") ... or ORDER BY DESC FETCH 1 on EVERY iteration. For 5 000 lines that is 5 000 SQL round-trips for a counter. One FindLast() before the loop + a local counter is O(1).\n\nSQL IMPACT: Per iteration: SELECT TOP 1 ... ORDER BY \\"Entry No_\\" DESC = N SQL queries.\n\nBAD:  foreach Line in ImportSource do begin Record.FindLast(); NextNo := Record.\\"Entry No.\\" + 1; ...\nGOOD: Record.FindLast(); NextNo := Record.\\"Entry No.\\" + 1;\n      foreach Line in ImportSource do begin NextNo += 1; ... end;\n\nHINT: Trace FindLast() calls in the loop with SQL Profiler. Each iteration fires ORDER BY DESC FETCH 1. Single FindLast before loop: 1 SQL query total.'),
    exercises=[26],
)
class PatternFindLastInLoop:
    @staticmethod
    def detect(text: str) -> list[dict]:
        findings = []
        lines = text.splitlines()
        in_loop = False
        for i, line in enumerate(lines):
            stripped = line.strip()
            if re.search(r'\bforeach\b|\brepeat\b', stripped, re.IGNORECASE):
                in_loop = True
            if re.match(r'until\s+\w+\.Next\(\)', stripped, re.IGNORECASE) or (stripped == 'end;' and in_loop):
                in_loop = False
            if in_loop and re.search(r'\w+\.(FindLast|FindFirst)\(\)', line) and not stripped.startswith('//'):
                findings.append({
                    "line": i + 1,
                    "snippet": line.strip()[:120],
                    "message": "FindLast/FindFirst inside loop — call once before the loop and cache the result"
                })
        return findings

    @staticmethod
    def fix(text: str) -> str:
        return text


# ───────────────────────────────────────────────────────────────────────
# PATTERN 25 — LockTable + FindLast for sequence generation (use NumberSequence)
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="LOCKTABLE_FOR_SEQUENCE",
    group="Locking",
    severity="HIGH",
    title="LockTable + FindLast for sequence numbers — use NumberSequence",
    description=("LockTable() acquires a full table-level exclusive write lock held for the entire transaction. Any concurrent session needing this table blocks. Under high-volume processing (hundreds of operations per minute) this creates lock wait queues and eventual timeout errors.\n\nSQL IMPACT: LockTable: X-lock on entire table for transaction duration.\nNumberSequence.Next(): atomic counter at DB level — no table lock.\n\nBAD:  Record.LockTable(true); if Record.FindLast() then NextNo := Record.PK + 1;\nGOOD: if not NumberSequence.Exists('MY_SEQ') then NumberSequence.Insert('MY_SEQ',1,1,false);\n      NextNo := NumberSequence.Next('MY_SEQ');\n\nHINT: LockTable: watch lock events in SQL Profiler. NumberSequence: no table lock — atomic sequence increment. Compare concurrency: run two sessions simultaneously."),
    exercises=[28],
)
class PatternLockTableForSequence:
    @staticmethod
    def detect(text: str) -> list[dict]:
        findings = []
        lines = text.splitlines()
        for i, line in enumerate(lines):
            if re.search(r'\w+\.LockTable\(', line) and not line.strip().startswith('//'):
                # Look ahead for FindLast to get next key
                ahead = '\n'.join(lines[i:min(len(lines), i+8)])
                if re.search(r'FindLast\(\)', ahead) and re.search(r'Entry No|NextSeq|NextNo|NextKey', ahead, re.IGNORECASE):
                    findings.append({
                        "line": i + 1,
                        "snippet": line.strip()[:120],
                        "message": "LockTable + FindLast for sequence generation — use NumberSequence.Next() instead"
                    })
        return findings

    @staticmethod
    def fix(text: str) -> str:
        return text


# ───────────────────────────────────────────────────────────────────────
# PATTERN 26 — SetRange on PK + FindFirst instead of Get
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="SETRANGE_FINDSET_FOR_GET",
    group="Data Transfer",
    severity="MEDIUM",
    title="SetRange on PK + FindFirst instead of direct Get()",
    description=('SetRange on a primary key field followed by FindFirst() goes through the filter+scan path instead of the optimized single-row lookup. Get() uses the primary key index directly — no cursor setup, hits the clustered index directly.\n\nSQL IMPACT: SetRange+FindFirst: SELECT TOP 50 ... WHERE \\"No_\\"=X (cursor setup overhead).\nGet(): Direct clustered index point lookup — no cursor. Measurably faster in high-frequency loops.\n\nBAD:  Customer.SetRange(\\"No.\\", CustomerNo); if Customer.FindFirst() then ...\nGOOD: if Customer.Get(CustomerNo) then ...\n\nHINT: Compare SELECT TOP 50 (SetRange+FindFirst) vs direct lookup. Get() hits clustered index directly — 1 read, no cursor.'),
    exercises=[29],
)
class PatternSetRangeFindFirstForGet:
    @staticmethod
    def detect(text: str) -> list[dict]:
        findings = []
        lines = text.splitlines()
        for i, line in enumerate(lines):
            m = re.search(r'(\w+)\.SetRange\("No\.",\s*\w+\)', line)
            if not m or line.strip().startswith('//'):
                continue
            var = m.group(1)
            ahead = '\n'.join(lines[i:min(len(lines), i+3)])
            if re.search(rf'\b{re.escape(var)}\.FindFirst\(\)', ahead):
                findings.append({
                    "line": i + 1,
                    "snippet": line.strip()[:120],
                    "message": f"'{var}.SetRange(\"No.\", ...) + FindFirst()' — use '{var}.Get(...)' directly"
                })
        return findings

    @staticmethod
    def fix(text: str) -> str:
        return text


# ───────────────────────────────────────────────────────────────────────
# PATTERN 27 — Silent Insert failure (if Insert then)
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="SILENT_INSERT_FAILURE",
    group="Write Patterns",
    severity="MEDIUM",
    title="'if Record.Insert(false) then' silently swallows duplicate-key errors",
    description=("In AL, Insert(false) does NOT suppress the SQL unique constraint error — it still propagates. Wrapping it in 'if ... then' gives a false sense that the failure is handled. In practice the record silently isn't created and the caller never knows, leading to data integrity gaps.\n\nSQL IMPACT: SQL unique constraint error still raised — 'if then' doesn't catch SQL errors.\nSilent failure → missing records → integrity gap.\n\nBAD:  if Record.Insert(false) then MovementCount += 1;\nGOOD: Record.Insert(false); MovementCount += 1;\n\nHINT: Insert a duplicate key row with 'if Insert then'. Check SQL Profiler — does the error appear? The record is not created but no AL error raised."),
    exercises=[30],
)
class PatternSilentInsertFailure:
    _RE = re.compile(r'if\s+\w+\.Insert\((?:false|true)\)\s+then', re.MULTILINE)

    @staticmethod
    def detect(text: str) -> list[dict]:
        return _findings(text, PatternSilentInsertFailure._RE,
                         lambda m: "Silent Insert — errors won't surface. Use plain Insert() or handle explicitly")

    @staticmethod
    def fix(text: str) -> str:
        return text


# ───────────────────────────────────────────────────────────────────────
# PATTERN 28 — LockTable too early (before read-only phase)
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="LOCKTABLE_TOO_EARLY",
    group="Locking",
    severity="HIGH",
    title="LockTable() called before read phase — holds write lock during reads",
    description=('LockTable() at the top of a procedure holds an exclusive lock through the entire validation / read phase — which may take seconds on large data. Every other session needing this table is blocked for the full duration. The lock is only needed at the moment of the first write.\n\nSQL IMPACT: X-lock held from top of proc through entire read phase (seconds).\nvs. X-lock acquired just before first Modify (milliseconds).\n\nBAD:  WorkshopData.LockTable(); ... if WorkshopData.FindSet() then [read loop] ...\nGOOD: [read loop without lock] ... WorkshopData.LockTable(); [write phase only]\n\nHINT: Use Activity Monitor or Profiler lock events. LockTable at start: X-lock held during entire read phase. LockTable at write phase: X-lock held for milliseconds only.'),
    exercises=[31, 42],
)
class PatternLockTableTooEarly:
    @staticmethod
    def detect(text: str) -> list[dict]:
        findings = []
        lines = text.splitlines()
        for i, line in enumerate(lines):
            if re.search(r'\w+\.LockTable\(', line) and not line.strip().startswith('//'):
                # Check if FindSet follows (read phase)
                ahead = '\n'.join(lines[i:min(len(lines), i+15)])
                if re.search(r'\.FindSet\(\)', ahead):
                    findings.append({
                        "line": i + 1,
                        "snippet": line.strip()[:120],
                        "message": "LockTable() before FindSet — move lock closer to the write operation"
                    })
        return findings

    @staticmethod
    def fix(text: str) -> str:
        return text


# ───────────────────────────────────────────────────────────────────────
# PATTERN 29 — Missing ReadIsolation (dirty reads safe = ReadUncommitted)
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="MISSING_READ_ISOLATION",
    group="Locking",
    severity="MEDIUM",
    title="FindSet on reporting/read-only query without ReadIsolation = ReadUncommitted",
    description=('Read-only analytics FindSet acquires Shared (S) locks on every fetched page. Concurrent warehouse write sessions hold Exclusive (X) locks on same rows. Result: analytics blocks postings, postings block analytics. On a 50 000-row scan, S-locks are held for several seconds.\n\nSQL IMPACT: Default isolation: Shared (S) locks per page fetched.\nReadUncommitted: NO lock acquisition — readers never block writers.\n\nGOOD: WorkshopData.ReadIsolation := IsolationLevel::ReadUncommitted;\n      if WorkshopData.FindSet() then ...\n\nHINT: Without ReadUncommitted: watch S-lock events per page in SQL Profiler. With ReadUncommitted: zero S-lock events — readers invisible. Never use for financial postings or validation.'),
    exercises=[34],
)
class PatternMissingReadIsolation:
    @staticmethod
    def detect(text: str) -> list[dict]:
        findings = []
        lines = text.splitlines()
        for i, line in enumerate(lines):
            if re.search(r'\w+\.FindSet\(\)', line) and not line.strip().startswith('//'):
                # Procedure name suggests reporting
                context_above = '\n'.join(lines[max(0, i-30):i])
                if re.search(r'Report|Dashboard|Export|Build.*Report|Snapshot', context_above, re.IGNORECASE):
                    if 'ReadIsolation' not in context_above:
                        findings.append({
                            "line": i + 1,
                            "snippet": line.strip()[:120],
                            "message": "Reporting FindSet without ReadIsolation := ReadUncommitted — may block concurrent writes"
                        })
        return findings

    @staticmethod
    def fix(text: str) -> str:
        return text


# ───────────────────────────────────────────────────────────────────────
# PATTERN 30 — RecordRef/FieldRef when typed Record is sufficient
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="RECORDREF_WHEN_TYPED_SUFFICIENT",
    group="Memory / Copies",
    severity="LOW",
    title="RecordRef/FieldRef used when a typed Record variable would suffice",
    description=('RecordRef provides late-bound, reflection-based table access. Each Field() call does a dictionary lookup + type boxing. SQL generation is less optimized than for typed Record variables. Benchmarks show 3–5x slower reads than typed Record on same data.\n\nSQL IMPACT: RecordRef: Field() lookup + boxing overhead per field per row.\nTyped Record: direct field access, compiler-optimized SQL.\n\nBAD:  RecRef: RecordRef; RecRef.Open(Database::\\"Workshop Data\\"); RecRef.Field(2).Value := ...;\nGOOD: WorkshopData: Record \\"Workshop Data\\"; WorkshopData.Description := ...;\n\nHINT: Compare RecordRef.Field(2).Value vs typed WorkshopData.Description. Run a 10 000-row loop with each — time the difference. RecordRef is 3–5x slower.'),
    exercises=[35],
)
class PatternRecordRefUnnecessary:
    _RE = re.compile(r'\bRecRef\s*:\s*RecordRef\b|\bFldRef\s*:\s*FieldRef\b', re.MULTILINE)

    @staticmethod
    def detect(text: str) -> list[dict]:
        return _findings(text, PatternRecordRefUnnecessary._RE,
                         lambda m: "RecordRef/FieldRef — consider typed Record variable if table is known at compile time")

    @staticmethod
    def fix(text: str) -> str:
        return text


# ───────────────────────────────────────────────────────────────────────
# PATTERN 31 — ModifyAll with RunTrigger=true
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="MODIFYALL_RUNTRIGGER_TRUE",
    group="Bulk Operations",
    severity="HIGH",
    title="ModifyAll with RunTrigger=true fires OnModify trigger per row",
    description=('ModifyAll() with RunTrigger=true checks for OnAfterModify subscribers. If ANY subscriber is bound, ModifyAll falls back to N individual Modify() calls — one per record — each triggering the subscriber. 10 000 records × 1 Modify() call = 10 000 SQL UPDATE round-trips.\n\nSQL IMPACT: With RunTrigger=true + active subscriber: N × UPDATE per row.\nWith RunTrigger=false: 1 × UPDATE ... WHERE ... (single SQL statement).\n\nBAD:  Record.ModifyAll(Field, Value, true);\nGOOD: Record.ModifyAll(Field, Value, false);\n\nHINT: Bind the subscriber and run ModifyAll with RunTrigger=true. SQL Profiler: count UPDATE statements — should be N rows. Change to RunTrigger=false: now count is 1 UPDATE statement.'),
    exercises=[37],
)
class PatternModifyAllRunTrigger:
    _RE = re.compile(r'\w+\.ModifyAll\([^)]+,\s*true\)', re.MULTILINE)

    @staticmethod
    def detect(text: str) -> list[dict]:
        return _findings(text, PatternModifyAllRunTrigger._RE,
                         lambda m: "ModifyAll with RunTrigger=true fires OnModify per row — use false unless required")

    @staticmethod
    def fix(text: str) -> str:
        return re.sub(
            r'(\w+\.ModifyAll\([^)]+,\s*)true(\))',
            r'\1false\2',
            text
        )


# ───────────────────────────────────────────────────────────────────────
# PATTERN 32 — Missing Database.SelectLatestVersion in multi-pass loop
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="MISSING_SELECTLATESTVERSION",
    group="Stale Reads",
    severity="MEDIUM",
    title="Multi-pass read loop without Database.SelectLatestVersion()",
    description=('BC NST caches SQL query results in-session. Repeated FindSet calls with the same filter return CACHED rows — no SQL executed after pass 1. A multi-pass pipeline reading the same filter silently returns stale data from pass 1 for passes 2–N if data changed concurrently.\n\nSQL IMPACT: Pass 1: SELECT ... (real SQL).\nPass 2–N: [NST cache hit] → no SQL, no awareness of concurrent updates.\n\nGOOD: foreach Pass in Passes do begin\n          Database.SelectLatestVersion(); // Flushes non-locked session cache\n          if Record.FindSet() then ...\n\nHINT: Run the pipeline twice: with and without SelectLatestVersion. Without flush: 0 SQL queries for passes 2–N (cache hit — stale data).'),
    exercises=[38],
)
class PatternMissingSelectLatestVersion:
    @staticmethod
    def detect(text: str) -> list[dict]:
        return []  # Too context-specific; covered by FIX comment detection

    @staticmethod
    def fix(text: str) -> str:
        return text


# ───────────────────────────────────────────────────────────────────────
# PATTERN 33 — OR chain instead of case true of (3+ conditions)
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="OR_CHAIN_USE_CASE_TRUE",
    group="Short-Circuit Evaluation",
    severity="MEDIUM",
    title="3+ OR conditions — use 'case true of' for short-circuit evaluation",
    description=('AL evaluates ALL operands of or before returning — even if the first operand is already true. Three expensive eligibility checks joined with or each execute a CalcSums or FindSet query — all three, every time.\n\nSQL IMPACT: 3 SQL queries per customer: CalcSums + IsEmpty + Count.\nEven when the first check already returns true — wasted 2 queries.\ncase true of with comma-separated conditions short-circuits at first true.\n\nBAD:  if IsOverCreditLimit(No) or HasBlockedItems(No) or HasOverdueInvoices(No) then ...\nGOOD: case true of\n          IsOverCreditLimit(No), HasBlockedItems(No), HasOverdueInvoices(No):\n              exit(false);\n      end;\n\nHINT: Add a counter inside each validation function. With or: all three counters increment for every customer. With case true of: only 1–2 counters increment when first is true.'),
    exercises=[39],
)
class PatternOrChainCaseTrue:
    _RE = re.compile(r'\bif\b[^;]+\bor\b[^;]+\bor\b[^;]+\bthen\b', re.MULTILINE | re.IGNORECASE)

    @staticmethod
    def detect(text: str) -> list[dict]:
        findings = []
        for m in PatternOrChainCaseTrue._RE.finditer(text):
            line = _find_line(text, m.start())
            line_text = text.splitlines()[line-1].strip()
            if line_text.startswith('//'):
                continue
            # Count function calls in the OR chain
            if len(re.findall(r'\w+\(', m.group(0))) >= 3:
                findings.append({
                    "line": line,
                    "snippet": m.group(0)[:120],
                    "message": "3+ OR conditions with function calls — use 'case true of' for short-circuit"
                })
        return findings

    @staticmethod
    def fix(text: str) -> str:
        return text


# ───────────────────────────────────────────────────────────────────────
# PATTERN 34 — LockTable + ReadIsolation UpdLock (Ex42)
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="LOCKTABLE_USE_UPDLOCK",
    group="Locking",
    severity="MEDIUM",
    title="LockTable() — consider ReadIsolation := UpdLock + FindSet(true) instead",
    description=('LockTable() acquires a table-level Exclusive (X) lock on the ENTIRE table. Every concurrent session — reads, analytics, order entry — blocks for the full transaction duration. A batch updating 1 000 rows can block all other sessions for seconds.\n\nSQL IMPACT: LockTable: X-lock on entire table — held for full transaction.\nReadIsolation := UpdLock + FindSet(true): acquires update locks only on rows actually read, allowing concurrent readers.\n\nBAD:  Record.LockTable();\n      if Record.FindSet() then\nGOOD: Record.ReadIsolation := IsolationLevel::UpdLock;\n      if Record.FindSet(true) then\n\nHINT: Open two BC sessions simultaneously. Session 1: run LockTable. Session 2: try any read — it blocks until Session 1 commits. With UpdLock: Session 2 reads freely.'),
    exercises=[42],
)
class PatternLockTableUseUpdLock:
    _RE = re.compile(r'(\w+)\.LockTable\(\)', re.MULTILINE)

    @staticmethod
    def detect(text: str) -> list[dict]:
        return _findings(text, PatternLockTableUseUpdLock._RE,
                         lambda m: f"Consider replacing '{m.group(1)}.LockTable()' with ReadIsolation := UpdLock + FindSet(true)")

    @staticmethod
    def fix(text: str) -> str:
        def replace(m):
            var = m.group(1)
            pos = m.end()
            ahead = text[pos:pos+200]
            if re.search(rf'\b{re.escape(var)}\.FindSet\(\)', ahead):
                replacement = f'{var}.ReadIsolation := IsolationLevel::UpdLock'
                # Also fix the FindSet in one pass
                return replacement
            return m.group(0)
        result = PatternLockTableUseUpdLock._RE.sub(replace, text)
        result = re.sub(r'(\w+)\.ReadIsolation := IsolationLevel::UpdLock;\s*\n(\s+)if \1\.FindSet\(\)',
                        r'\1.ReadIsolation := IsolationLevel::UpdLock;\n\2if \1.FindSet(true)', result)
        return result


# ───────────────────────────────────────────────────────────────────────
# PATTERN 35 — true in [...] condition order (cheapest first)
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="CONDITION_ORDER_TRUE_IN",
    group="Short-Circuit Evaluation",
    severity="LOW",
    title="'if true in [...]' — put cheapest condition first for best short-circuit",
    description=("AL's in [...] operator DOES short-circuit — unlike or/\x07nd. But placing the most expensive check FIRST defeats the benefit: the CalcSums fires before the cheap blacklist Get() is even tested. Rule: always order conditions cheapest-first in in [...] lists.\n\nSQL IMPACT: Expensive-first: CalcSums runs for ~100% of customers.\nCheap-first: CalcSums skipped for the ~35% caught by cheaper checks first.\n\nBAD:  if true in [HasExceededAnnualBudget(No), IsBlacklisted(No)] then ...\nGOOD: if true in [IsBlacklisted(No), HasExceededAnnualBudget(No)] then ...\n\nHINT: Add a Message() counter inside HasExceededAnnualBudget. Run with expensive-first: counter = total customer count. Reorder to cheap-first: counter drops by ~35%."),
    exercises=[44],
)
class PatternConditionOrderTrueIn:
    _RE = re.compile(r'if true in \[', re.MULTILINE | re.IGNORECASE)

    @staticmethod
    def detect(text: str) -> list[dict]:
        return _findings(text, PatternConditionOrderTrueIn._RE,
                         lambda m: "Review condition order: put cheapest check first for best short-circuit performance")

    @staticmethod
    def fix(text: str) -> str:
        return text


# ───────────────────────────────────────────────────────────────────────
# PATTERN 36 — N+1 nested FindSet inside repeat..until loop (Ex 27 / 43)
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="NESTED_FINDSET_N_PLUS_ONE",
    group="Data Transfer",
    severity="HIGH",
    title="Nested FindSet/FindFirst inside repeat..until loop (N+1 queries)",
    description=(
        "For each row in the outer FindSet, an inner FindSet on a different variable fires a new SQL query. "
        "With 1 000 outer items: 1 outer SELECT + 1 000 inner SELECTs = 1 001 SQL round-trips. "
        "A Query object with GROUP BY does the same work in a single SQL query.\n\n"
        "SQL IMPACT: 1 000 items × 1 inner query = 1 001 total SQL round-trips.\n"
        "Query object: 1 SQL query with GROUP BY — result set = N groups only.\n\n"
        "BAD:  if Items.FindSet() then repeat\n"
        "          SalesLines.SetRange(\"No.\", Items.\"No.\");\n"
        "          if SalesLines.FindSet() then repeat ... until SalesLines.Next() = 0;\n"
        "      until Items.Next() = 0;\n"
        "GOOD: var AnalysisQuery: Query \"Workshop Item Analysis\";\n"
        "      if AnalysisQuery.Open() then\n"
        "          while AnalysisQuery.Read() do ...\n\n"
        "HINT: Count SQL queries in Profiler for the nested loop. Each outer row fires 1 inner SQL query. "
        "Query object version: 1 SQL query with GROUP BY regardless of data volume."
    ),
    exercises=[27, 43],
)
class PatternNestedFindSetNPlusOne:
    @staticmethod
    def detect(text: str) -> list[dict]:
        findings = []
        lines = text.splitlines()
        outer_var: str | None = None
        in_loop = False

        for i, line in enumerate(lines):
            stripped = line.strip()
            if stripped.startswith('//'):
                continue

            # Track outer FindSet before a repeat
            m_outer = re.search(r'(\w+)\.(FindSet|FindFirst)\(', line)
            if m_outer and not in_loop:
                outer_var = m_outer.group(1)

            if re.match(r'^repeat\b', stripped, re.IGNORECASE) and outer_var:
                in_loop = True

            if in_loop:
                m_inner = re.search(r'(\w+)\.(FindSet|FindFirst)\(', line)
                if m_inner and m_inner.group(1) != outer_var:
                    findings.append({
                        "line": i + 1,
                        "snippet": line.strip()[:120],
                        "message": (
                            f"Nested {m_inner.group(2)}() on '{m_inner.group(1)}' inside outer "
                            f"'{outer_var}' FindSet loop — N+1 SQL queries. "
                            "Consider a Query object with GROUP BY."
                        ),
                    })

            if re.match(r'^until\s+\w+\.Next\(\)', stripped, re.IGNORECASE):
                in_loop = False
                outer_var = None

        return findings

    @staticmethod
    def fix(text: str) -> str:
        return text  # Structural change required — no auto-fix


# ───────────────────────────────────────────────────────────────────────
# PATTERN 37 — AutoIncrement = true disables SQL batch INSERT (Ex 36)
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="AUTOINCREMENT_DISABLES_BULK_INSERT",
    group="Bulk Operations",
    severity="HIGH",
    title="AutoIncrement = true on PK disables SQL batch INSERT",
    description=(
        "SQL Server IDENTITY (AutoIncrement = true) requires SCOPE_IDENTITY() to be returned "
        "after each INSERT — this prevents batch INSERT entirely. "
        "For 10 000 count sheet lines: 10 000 individual SQL INSERTs, one per row. "
        "Manual PK assignment via NumberSequence allows SQL Server to batch rows into one trip.\n\n"
        "SQL IMPACT: AutoIncrement: 10 000 × INSERT (+ SCOPE_IDENTITY per row).\n"
        "Manual PK with NumberSequence: ~10 batch INSERT statements — orders of magnitude faster.\n\n"
        "BAD:  field(1; Id; Integer) { AutoIncrement = true; }\n"
        "GOOD: field(1; Id; Integer) { }\n"
        "      // In code:\n"
        "      Entry.Id := NumberSequence.Next('WS_COUNT_SEQ');\n"
        "      Entry.Insert(false); // Batchable — no identity return needed\n\n"
        "HINT: Insert 10 000 rows into both tables in SQL Profiler. "
        "AutoIncrement table: 10 000 individual INSERT statements. "
        "Manual key table: ~10 batch INSERT statements total."
    ),
    exercises=[36],
)
class PatternAutoIncrementBulkInsert:
    _RE = re.compile(r'AutoIncrement\s*=\s*true', re.IGNORECASE)

    @staticmethod
    def detect(text: str) -> list[dict]:
        return _findings(
            text,
            PatternAutoIncrementBulkInsert._RE,
            lambda m: (
                "AutoIncrement = true requires SCOPE_IDENTITY() per INSERT — prevents SQL batch inserts. "
                "Remove AutoIncrement and use NumberSequence.Next() for PK assignment."
            ),
        )

    @staticmethod
    def fix(text: str) -> str:
        return text  # Requires table redesign + code change — no auto-fix


# ───────────────────────────────────────────────────────────────────────
# PATTERN 38 — AL-side GROUP BY aggregation (Ex 43)
# ───────────────────────────────────────────────────────────────────────
@_register(
    id="AL_SIDE_AGGREGATION",
    group="Aggregation",
    severity="HIGH",
    title="AL-side GROUP BY aggregation — push to SQL with a Query object",
    description=(
        "Manual AL aggregation: FindSet fetches ALL rows into NST, accumulates sums per group in AL. "
        "For 100 000 entries — 100 000 rows transferred to NST memory. "
        "A Query object with Method = Sum pushes GROUP BY and SUM() to SQL Server. "
        "SQL returns only N rows (one per group) — 99 990 rows never leave the database.\n\n"
        "SQL IMPACT: AL loop:  SELECT all 100 000 rows, SUM in NST memory.\n"
        "Query:     SELECT Location, SUM(Amount) GROUP BY Location → 10 rows only.\n\n"
        "BAD:  if WorkshopData.FindSet() then repeat\n"
        "          TotalByLocation.Add(WorkshopData.\"Location Code\", WorkshopData.Amount);\n"
        "      until WorkshopData.Next() = 0;\n"
        "GOOD: var RevenueQuery: Query \"WS Location Revenue\";\n"
        "      if RevenueQuery.Open() then\n"
        "          while RevenueQuery.Read() do\n"
        "              ProcessSummary(RevenueQuery.Location_Code, RevenueQuery.Sum_Line_Amount);\n\n"
        "HINT: Run the manual loop on 50 000 rows. Check SQL Profiler: count SELECT rows returned. "
        "Then switch to the Query version. Profiler shows 1 query returning only N rows. "
        "Duration difference is dramatic at scale."
    ),
    exercises=[43],
)
class PatternAlSideAggregation:
    # Detect FindSet loop that accumulates into a Dictionary by group key
    _RE = re.compile(
        r'FindSet\s*\([^)]*\).*?repeat.*?\.Add\s*\(',
        re.IGNORECASE | re.DOTALL,
    )

    @staticmethod
    def detect(text: str) -> list[dict]:
        findings = []
        for m in PatternAlSideAggregation._RE.finditer(text):
            line = _find_line(text, m.start())
            snippet = text[m.start(): m.start() + 80].split('\n')[0].strip()
            findings.append({
                "line": line,
                "message": (
                    "AL-side GROUP BY aggregation — fetches all rows to NST. "
                    "Use a Query object with Method = Sum to push GROUP BY to SQL Server."
                ),
                "snippet": snippet,
            })
        return findings

    @staticmethod
    def fix(text: str) -> str:
        return text  # Structural change required — no auto-fix


# ───────────────────────────────────────────────────────────────────────
# Utility helpers
# ───────────────────────────────────────────────────────────────────────

def _scan_file(path: Path) -> list[dict]:
    """Run all detectors on a single AL file. Returns list of finding dicts."""
    try:
        text = path.read_text(encoding='utf-8-sig')
    except Exception as e:
        return [{"pattern": "READ_ERROR", "file": str(path), "line": 0, "snippet": str(e), "message": "Could not read file"}]

    findings = []
    for p in PATTERNS:
        for f in p["detector"](text):
            findings.append({
                "pattern": p["id"],
                "severity": p["severity"],
                "title": p["title"],
                "file": str(path),
                **f
            })
    return findings


def _fix_file(path: Path) -> tuple[str, list[str]]:
    """Apply all fixers to a single AL file. Returns (new_text, list_of_applied_fixes)."""
    try:
        text = path.read_text(encoding='utf-8-sig')
    except Exception as e:
        return "", [f"READ_ERROR: {e}"]

    applied = []
    original = text
    for p in PATTERNS:
        new_text = p["fixer"](text)
        if new_text != text:
            applied.append(p["id"])
            text = new_text

    return text, applied


def _al_files(folder: Path) -> list[Path]:
    return sorted(folder.rglob("*.al"))


# ───────────────────────────────────────────────────────────────────────
# MCP Tools
# ───────────────────────────────────────────────────────────────────────

@mcp.tool()
def list_patterns() -> str:
    """
    List all known AL performance anti-patterns with IDs, severity, and short descriptions.
    Use this to understand what the analyzer can detect before running a scan.
    """
    lines = ["# AL Performance Patterns\n"]
    groups: dict[str, list] = {}
    for p in PATTERNS:
        groups.setdefault(p["group"], []).append(p)

    for group, items in sorted(groups.items()):
        lines.append(f"\n## {group}\n")
        for p in items:
            lines.append(f"- **[{p['severity']}]** `{p['id']}`  \n  {p['title']}  \n  Exercises: {p['exercises']}\n")

    return "\n".join(lines)


@mcp.tool()
def explain_pattern(pattern_id: str) -> str:
    """
    Get a full explanation of a specific performance pattern including examples and the fix.

    Args:
        pattern_id: The pattern ID (e.g. 'MISSING_SETLOADFIELDS'). Use list_patterns() to see all IDs.
    """
    for p in PATTERNS:
        if p["id"].upper() == pattern_id.upper():
            return (
                f"# {p['title']}\n\n"
                f"**ID:** `{p['id']}`  \n"
                f"**Severity:** {p['severity']}  \n"
                f"**Category:** {p['group']}  \n"
                f"**Workshop Exercises:** {p['exercises']}\n\n"
                f"{p['description']}"
            )
    ids = ", ".join(p["id"] for p in PATTERNS)
    return f"Pattern '{pattern_id}' not found. Known IDs: {ids}"


@mcp.tool()
def scan_al_workspace(
    folder_path: str,
    severity_filter: str = "ALL",
    group_filter: str = "ALL",
) -> str:
    """
    Scan all AL files in a folder (recursively) for performance anti-patterns.
    Returns a structured report of findings grouped by file.

    Args:
        folder_path: Absolute path to the folder containing AL source files.
        severity_filter: Filter by severity: HIGH, MEDIUM, LOW, or ALL (default ALL).
        group_filter: Filter by pattern group name or ALL (default ALL).
    """
    folder = Path(folder_path)
    if not folder.exists():
        return f"ERROR: Folder not found: {folder_path}"

    files = _al_files(folder)
    if not files:
        return f"No .al files found in {folder_path}"

    all_findings: list[dict] = []
    for f in files:
        all_findings.extend(_scan_file(f))

    # Apply filters
    if severity_filter.upper() != "ALL":
        all_findings = [f for f in all_findings if f["severity"].upper() == severity_filter.upper()]
    if group_filter.upper() != "ALL":
        all_findings = [f for f in all_findings if
                        any(p["group"].upper() == group_filter.upper()
                            for p in PATTERNS if p["id"] == f["pattern"])]

    if not all_findings:
        return f"✅ No issues found ({len(files)} files scanned)."

    # Group by file
    by_file: dict[str, list] = {}
    for f in all_findings:
        by_file.setdefault(f["file"], []).append(f)

    severity_order = {"HIGH": 0, "MEDIUM": 1, "LOW": 2}
    total = len(all_findings)
    high = sum(1 for f in all_findings if f["severity"] == "HIGH")
    medium = sum(1 for f in all_findings if f["severity"] == "MEDIUM")
    low = sum(1 for f in all_findings if f["severity"] == "LOW")

    lines = [
        f"# AL Performance Scan Results\n",
        f"**Folder:** `{folder_path}`  ",
        f"**Files scanned:** {len(files)}  ",
        f"**Issues found:** {total} ({high} HIGH, {medium} MEDIUM, {low} LOW)\n",
    ]

    for filepath, findings in sorted(by_file.items()):
        rel = Path(filepath).relative_to(folder) if Path(filepath).is_relative_to(folder) else Path(filepath).name
        lines.append(f"\n## `{rel}`\n")
        findings_sorted = sorted(findings, key=lambda x: severity_order.get(x["severity"], 9))
        for f in findings_sorted:
            sev_icon = {"HIGH": "🔴", "MEDIUM": "🟡", "LOW": "🔵"}.get(f["severity"], "⚪")
            lines.append(f"- {sev_icon} **L{f['line']}** `{f['pattern']}`: {f['message']}")
            if f.get("snippet"):
                lines.append(f"  ```al\n  {f['snippet']}\n  ```")

    return "\n".join(lines)


@mcp.tool()
def fix_al_file(
    file_path: str,
    dry_run: bool = True,
) -> str:
    """
    Apply all available automatic fixes to a single AL file.

    Args:
        file_path: Absolute path to the .al file to fix.
        dry_run: If True (default), show what would change without writing. Set False to write.
    """
    path = Path(file_path)
    if not path.exists():
        return f"ERROR: File not found: {file_path}"

    original = path.read_text(encoding='utf-8-sig')
    new_text, applied = _fix_file(path)

    if not applied:
        return f"✅ No automatic fixes applicable to `{path.name}`."

    lines = [f"# Fix Report: `{path.name}`\n"]
    lines.append(f"**Fixes applied:** {', '.join(applied)}\n")

    if dry_run:
        lines.append("**Mode:** DRY RUN — no file written. Set dry_run=False to apply.\n")
        # Show diff summary
        orig_lines = original.splitlines()
        new_lines = new_text.splitlines()
        changes = 0
        for i, (o, n) in enumerate(zip(orig_lines, new_lines)):
            if o != n:
                lines.append(f"L{i+1}: `{o.strip()}` → `{n.strip()}`")
                changes += 1
                if changes >= 20:
                    lines.append(f"... (and more)")
                    break
    else:
        path.write_text(new_text, encoding='utf-8-sig')
        lines.append(f"✅ File written: `{file_path}`")

    return "\n".join(lines)


@mcp.tool()
def fix_al_workspace(
    folder_path: str,
    dry_run: bool = True,
) -> str:
    """
    Apply all available automatic fixes to every AL file in a folder (recursively).

    Args:
        folder_path: Absolute path to the folder containing AL source files.
        dry_run: If True (default), show what would change without writing. Set False to write.
    """
    folder = Path(folder_path)
    if not folder.exists():
        return f"ERROR: Folder not found: {folder_path}"

    files = _al_files(folder)
    if not files:
        return f"No .al files found in {folder_path}"

    results = []
    total_fixes = 0
    for f in files:
        original = f.read_text(encoding='utf-8-sig')
        new_text, applied = _fix_file(f)
        if applied:
            total_fixes += len(applied)
            results.append((f, applied, original != new_text))
            if not dry_run and original != new_text:
                f.write_text(new_text, encoding='utf-8-sig')

    if not results:
        return f"✅ No automatic fixes applicable in {len(files)} files."

    mode = "DRY RUN" if dry_run else "APPLIED"
    lines = [
        f"# Fix Workspace Report [{mode}]\n",
        f"**Folder:** `{folder_path}`  ",
        f"**Files with fixes:** {len(results)} of {len(files)}  ",
        f"**Total fix operations:** {total_fixes}\n",
    ]

    for f, applied, changed in results:
        rel = f.relative_to(folder) if f.is_relative_to(folder) else f.name
        status = "✅ written" if (not dry_run and changed) else ("📝 would change" if changed else "⟳ no change")
        lines.append(f"- `{rel}` [{status}]: {', '.join(applied)}")

    if dry_run:
        lines.append("\n> Set `dry_run=False` to apply all changes.")

    return "\n".join(lines)


@mcp.tool()
def scan_al_code(
    al_code: str,
    file_hint: str = "inline",
) -> str:
    """
    Scan a snippet of AL code (pasted inline) for performance issues.
    Useful for checking code before committing or during code review.

    Args:
        al_code: The AL code text to analyze.
        file_hint: Optional label for the code (e.g. the procedure name).
    """
    findings: list[dict] = []
    for p in PATTERNS:
        for f in p["detector"](al_code):
            findings.append({
                "pattern": p["id"],
                "severity": p["severity"],
                "title": p["title"],
                "file": file_hint,
                **f
            })

    if not findings:
        return "✅ No performance issues detected in the provided code."

    severity_order = {"HIGH": 0, "MEDIUM": 1, "LOW": 2}
    findings_sorted = sorted(findings, key=lambda x: severity_order.get(x["severity"], 9))

    lines = [f"# Performance Issues in `{file_hint}`\n"]
    for f in findings_sorted:
        sev_icon = {"HIGH": "🔴", "MEDIUM": "🟡", "LOW": "🔵"}.get(f["severity"], "⚪")
        lines.append(f"{sev_icon} **L{f['line']}** `{f['pattern']}` — {f['message']}")
        lines.append(f"  > {f['title']}")
        if f.get("snippet"):
            lines.append(f"  ```al\n  {f['snippet']}\n  ```")
        lines.append("")

    return "\n".join(lines)


# ═══════════════════════════════════════════════════════════════════════
# ORCHESTRATION LAYER
# ═══════════════════════════════════════════════════════════════════════
#
# Architecture:
#   analyze_al_performance(folder)          ← master orchestrator
#       internally delegates to one function per pattern group (sub-agents)
#       aggregates all results into a unified priority report
#
#   Individual group sub-agent tools also exposed so the LLM can call
#   them independently when the user asks about a specific category.
#
# ═══════════════════════════════════════════════════════════════════════

# ─── Internal sub-agent runner ────────────────────────────────────────

def _run_group_agent(group_name: str, folder: Path) -> dict:
    """
    Run all detectors belonging to a single pattern group against every AL file.
    Returns a structured result dict — this is what each sub-agent produces.
    """
    group_patterns = [p for p in PATTERNS if p["group"] == group_name]
    files = _al_files(folder)

    findings: list[dict] = []
    for f in files:
        try:
            text = f.read_text(encoding="utf-8-sig")
        except Exception:
            continue
        for p in group_patterns:
            for finding in p["detector"](text):
                findings.append({
                    "pattern": p["id"],
                    "severity": p["severity"],
                    "title": p["title"],
                    "file": str(f),
                    "rel_file": str(f.relative_to(folder)) if f.is_relative_to(folder) else f.name,
                    **finding
                })

    high   = [f for f in findings if f["severity"] == "HIGH"]
    medium = [f for f in findings if f["severity"] == "MEDIUM"]
    low    = [f for f in findings if f["severity"] == "LOW"]

    # Auto-fixable patterns in this group
    fixable = [p["id"] for p in group_patterns if _is_pattern_auto_fixable(p["id"])]

    return {
        "group": group_name,
        "patterns_checked": [p["id"] for p in group_patterns],
        "files_scanned": len(files),
        "total": len(findings),
        "high": len(high),
        "medium": len(medium),
        "low": len(low),
        "fixable_patterns": fixable,
        "findings": findings,
    }


_AUTO_FIXABLE = {
    "FIND_DASH_BUFFER_ONE",
    "COUNT_NOT_ZERO",
    "COUNT_EQUALS_ONE",
    "ISEMPTY_BEFORE_FINDSET",
    "FINDSET_BEFORE_MODIFYALL",
    "FINDSET_BEFORE_DELETEALL",
    "MODIFYALL_RUNTRIGGER_TRUE",
    "MISSING_TEMPORARY",
    "FINDSET_MODIFY_NO_TRUE",
    "LOCKTABLE_USE_UPDLOCK",
    "FINDFIRST_IN_LOOP",
}

def _is_pattern_auto_fixable(pattern_id: str) -> bool:
    return pattern_id in _AUTO_FIXABLE


def _format_group_report(result: dict, folder: Path, detail_level: str = "summary") -> list[str]:
    """Render one group sub-agent result as markdown lines."""
    sev_icon = "🔴" if result["high"] > 0 else ("🟡" if result["medium"] > 0 else "✅")
    lines = [
        f"\n### {sev_icon} {result['group']}",
        f"Found **{result['total']}** issue(s) — "
        f"{result['high']} HIGH, {result['medium']} MEDIUM, {result['low']} LOW",
    ]
    if result["fixable_patterns"]:
        lines.append(f"Auto-fixable patterns: `{'`, `'.join(result['fixable_patterns'])}`")

    if detail_level != "full" or result["total"] == 0:
        return lines

    severity_order = {"HIGH": 0, "MEDIUM": 1, "LOW": 2}
    findings_sorted = sorted(result["findings"], key=lambda x: severity_order.get(x["severity"], 9))
    seen: set[str] = set()
    for f in findings_sorted[:15]:  # cap per group
        key = f"{f['rel_file']}:{f['line']}:{f['pattern']}"
        if key in seen:
            continue
        seen.add(key)
        icon = {"HIGH": "🔴", "MEDIUM": "🟡", "LOW": "🔵"}.get(f["severity"], "⚪")
        lines.append(f"  - {icon} `{f['rel_file']}` L{f['line']} `{f['pattern']}`: {f['message']}")
    if len(result["findings"]) > 15:
        lines.append(f"  - _(… {len(result['findings']) - 15} more — use group sub-agent for full list)_")
    return lines


# ─── Group sub-agent tools ────────────────────────────────────────────
# Each exposed as its own MCP tool so the LLM can call them independently.

def _group_tool_impl(group_name: str, folder_path: str) -> str:
    folder = Path(folder_path)
    if not folder.exists():
        return f"ERROR: Folder not found: {folder_path}"
    result = _run_group_agent(group_name, folder)
    lines = [f"# Sub-Agent: {group_name}\n",
             f"**Folder:** `{folder_path}`  ",
             f"**Issues:** {result['total']} ({result['high']} HIGH, {result['medium']} MEDIUM, {result['low']} LOW)\n"]
    lines += _format_group_report(result, folder, detail_level="full")
    return "\n".join(lines)


@mcp.tool()
def scan_data_transfer_issues(folder_path: str) -> str:
    """
    Sub-agent: Scan for Data Transfer anti-patterns.
    Covers: missing SetLoadFields, Find('-') buffer-size-1, FindFirst in loops, FindLast in loops,
    SetRange+FindFirst instead of Get, SetCurrentKey missing.
    """
    return _group_tool_impl("Data Transfer", folder_path)


@mcp.tool()
def scan_flowfield_issues(folder_path: str) -> str:
    """
    Sub-agent: Scan for FlowField anti-patterns.
    Covers: CalcFields inside loops, SetFilter on FlowField (correlated subquery).
    """
    return _group_tool_impl("FlowFields", folder_path)


@mcp.tool()
def scan_aggregation_issues(folder_path: str) -> str:
    """
    Sub-agent: Scan for Aggregation anti-patterns.
    Covers: manual summation loops that should use CalcSums().
    """
    return _group_tool_impl("Aggregation", folder_path)


@mcp.tool()
def scan_bulk_operation_issues(folder_path: str) -> str:
    """
    Sub-agent: Scan for Bulk Operation anti-patterns.
    Covers: Delete in loop, FindSet before ModifyAll, FindSet before DeleteAll,
    ModifyAll with RunTrigger=true.
    """
    return _group_tool_impl("Bulk Operations", folder_path)


@mcp.tool()
def scan_existence_check_issues(folder_path: str) -> str:
    """
    Sub-agent: Scan for Existence Check anti-patterns.
    Covers: Count() != 0 vs IsEmpty(), redundant IsEmpty before FindSet, Count() = 1 uniqueness.
    """
    return _group_tool_impl("Existence Checks", folder_path)


@mcp.tool()
def scan_locking_issues(folder_path: str) -> str:
    """
    Sub-agent: Scan for Locking anti-patterns.
    Covers: LockTable too early, LockTable for sequence generation, DeleteAll without IsEmpty guard,
    LockTable vs ReadIsolation UpdLock.
    """
    return _group_tool_impl("Locking", folder_path)


@mcp.tool()
def scan_memory_issues(folder_path: str) -> str:
    """
    Sub-agent: Scan for Memory / Copy anti-patterns.
    Covers: Record parameter by value, missing 'temporary' keyword, temp table used as Dictionary,
    temp table used as collection, RecordRef when typed Record suffices.
    """
    return _group_tool_impl("Memory / Copies", folder_path)


@mcp.tool()
def scan_short_circuit_issues(folder_path: str) -> str:
    """
    Sub-agent: Scan for Short-Circuit Evaluation anti-patterns.
    Covers: OR/AND eager evaluation, 3+ OR conditions (use case true of),
    'if true in [...]' condition ordering.
    """
    return _group_tool_impl("Short-Circuit Evaluation", folder_path)


@mcp.tool()
def scan_write_pattern_issues(folder_path: str) -> str:
    """
    Sub-agent: Scan for Write Pattern anti-patterns.
    Covers: Insert-on-conflict (try Insert, Modify on fail), silent Insert failure.
    """
    return _group_tool_impl("Write Patterns", folder_path)


@mcp.tool()
def scan_cursor_safety_issues(folder_path: str) -> str:
    """
    Sub-agent: Scan for Cursor Safety anti-patterns.
    Covers: SetRange/SetFilter on active FindSet cursor (corrupts iteration),
    FindSet(true) missing when Modify is called on cursor variable.
    """
    # Combine Cursor Safety + the FindSet(true) pattern
    return _group_tool_impl("Cursor Safety", folder_path)


@mcp.tool()
def scan_stale_read_issues(folder_path: str) -> str:
    """
    Sub-agent: Scan for Stale Read anti-patterns.
    Covers: missing ReadIsolation on reporting queries, missing SelectLatestVersion in multi-pass loops.
    """
    return _group_tool_impl("Stale Reads", folder_path)


# ─── Master orchestrator tool ─────────────────────────────────────────

@mcp.tool()
def analyze_al_performance(
    folder_path: str,
    include_action_plan: bool = True,
) -> str:
    """
    MASTER ORCHESTRATOR — runs all pattern-group sub-agents in sequence and produces
    a unified performance report with a prioritized action plan.

    This is the primary entry point. It:
      1. Delegates to each pattern-group sub-agent (Data Transfer, FlowFields, Locking, etc.)
      2. Aggregates all findings across all groups
      3. Ranks files by total issue severity score
      4. Produces a prioritized action plan: which files to fix first and how
      5. Lists all auto-fixable patterns with the fix command to run

    Args:
        folder_path: Absolute path to the AL workspace folder to analyze.
        include_action_plan: Include the prioritized fix plan (default True).
    """
    folder = Path(folder_path)
    if not folder.exists():
        return f"ERROR: Folder not found: {folder_path}"

    files = _al_files(folder)
    if not files:
        return f"No .al files found in {folder_path}"

    # ── Step 1: Collect all unique group names from the pattern registry ──
    all_groups = sorted({p["group"] for p in PATTERNS})

    # ── Step 2: Run each group sub-agent ──────────────────────────────────
    group_results: list[dict] = []
    for group in all_groups:
        result = _run_group_agent(group, folder)
        group_results.append(result)

    # ── Step 3: Aggregate ─────────────────────────────────────────────────
    all_findings: list[dict] = []
    for r in group_results:
        all_findings.extend(r["findings"])

    total   = len(all_findings)
    high    = sum(1 for f in all_findings if f["severity"] == "HIGH")
    medium  = sum(1 for f in all_findings if f["severity"] == "MEDIUM")
    low     = sum(1 for f in all_findings if f["severity"] == "LOW")
    score   = high * 10 + medium * 3 + low  # weighted severity score

    # Files ranked by severity score
    file_scores: dict[str, dict] = {}
    for f in all_findings:
        fp = f["file"]
        if fp not in file_scores:
            file_scores[fp] = {"high": 0, "medium": 0, "low": 0, "patterns": set(), "rel": f["rel_file"]}
        file_scores[fp][f["severity"].lower()] += 1
        file_scores[fp]["patterns"].add(f["pattern"])

    ranked_files = sorted(
        file_scores.items(),
        key=lambda x: x[1]["high"] * 10 + x[1]["medium"] * 3 + x[1]["low"],
        reverse=True
    )

    # Auto-fixable findings
    fixable_findings = [f for f in all_findings if _is_pattern_auto_fixable(f["pattern"])]
    fixable_count = len(fixable_findings)
    fixable_files = sorted({f["rel_file"] for f in fixable_findings})

    # ── Step 4: Build report ──────────────────────────────────────────────
    lines = [
        "# 🔍 AL Performance Analysis — Orchestrator Report\n",
        f"**Workspace:** `{folder_path}`  ",
        f"**Files scanned:** {len(files)}  ",
        f"**Total issues:** {total} (🔴 {high} HIGH, 🟡 {medium} MEDIUM, 🔵 {low} LOW)  ",
        f"**Severity score:** {score}  ",
        f"**Auto-fixable:** {fixable_count} issues in {len(fixable_files)} files\n",
        "---\n",
        "## Sub-Agent Results by Group\n",
        "| Group | HIGH | MED | LOW | Total |",
        "|-------|------|-----|-----|-------|",
    ]
    for r in group_results:
        status = "🔴" if r["high"] > 0 else ("🟡" if r["medium"] > 0 else "✅")
        lines.append(f"| {status} {r['group']} | {r['high']} | {r['medium']} | {r['low']} | {r['total']} |")

    # ── Top offending files ───────────────────────────────────────────────
    lines += ["\n---\n", "## 🏆 Files Ranked by Severity Score\n"]
    for i, (fp, sc) in enumerate(ranked_files[:10], 1):
        file_score = sc["high"] * 10 + sc["medium"] * 3 + sc["low"]
        patterns_str = ", ".join(f"`{p}`" for p in sorted(sc["patterns"]))
        lines.append(
            f"{i}. **`{sc['rel']}`** — score {file_score} "
            f"(🔴{sc['high']} 🟡{sc['medium']} 🔵{sc['low']})  \n"
            f"   Patterns: {patterns_str}"
        )
    if len(ranked_files) > 10:
        lines.append(f"\n_… and {len(ranked_files) - 10} more files with issues._")

    # ── Action plan ───────────────────────────────────────────────────────
    if include_action_plan:
        lines += ["\n---\n", "## 📋 Prioritized Action Plan\n"]

        # Phase 1: Auto-fixable
        if fixable_findings:
            lines.append("### Phase 1 — Run Automatic Fixes (zero manual effort)")
            lines.append(f"These {fixable_count} issues can be fixed instantly with `fix_al_workspace`:")
            for pid in sorted(_AUTO_FIXABLE):
                count = sum(1 for f in all_findings if f["pattern"] == pid)
                if count > 0:
                    title = next((p["title"] for p in PATTERNS if p["id"] == pid), pid)
                    lines.append(f"  - `{pid}` × {count} — {title}")
            lines.append(f"\n> **Run:** `fix_al_workspace(\"{folder_path}\", dry_run=False)`")

        # Phase 2: High severity manual fixes
        high_manual = [f for f in all_findings if f["severity"] == "HIGH" and not _is_pattern_auto_fixable(f["pattern"])]
        if high_manual:
            lines.append("\n### Phase 2 — High Severity (manual code changes required)")
            by_pattern: dict[str, list] = {}
            for f in high_manual:
                by_pattern.setdefault(f["pattern"], []).append(f)
            for pid, findings in sorted(by_pattern.items(), key=lambda x: -len(x[1])):
                title = next((p["title"] for p in PATTERNS if p["id"] == pid), pid)
                files_affected = sorted({f["rel_file"] for f in findings})
                lines.append(f"\n**`{pid}`** × {len(findings)} — {title}")
                lines.append(f"  Files: {', '.join(f'`{f}`' for f in files_affected[:5])}")
                lines.append(f"  > Run `explain_pattern(\"{pid}\")` for the fix pattern")

        # Phase 3: Medium
        medium_manual = [f for f in all_findings if f["severity"] == "MEDIUM" and not _is_pattern_auto_fixable(f["pattern"])]
        if medium_manual:
            by_pattern2: dict[str, int] = {}
            for f in medium_manual:
                by_pattern2[f["pattern"]] = by_pattern2.get(f["pattern"], 0) + 1
            lines.append("\n### Phase 3 — Medium Severity")
            for pid, count in sorted(by_pattern2.items(), key=lambda x: -x[1]):
                title = next((p["title"] for p in PATTERNS if p["id"] == pid), pid)
                lines.append(f"  - `{pid}` × {count} — {title}")

        # Drill-down hints
        lines += [
            "\n---\n",
            "## 🔬 Drill Down with Sub-Agents\n",
            "Call these tools for a full per-file breakdown of each category:\n",
        ]
        group_tool_map = {
            "Data Transfer":            "scan_data_transfer_issues",
            "FlowFields":               "scan_flowfield_issues",
            "Aggregation":              "scan_aggregation_issues",
            "Bulk Operations":          "scan_bulk_operation_issues",
            "Existence Checks":         "scan_existence_check_issues",
            "Locking":                  "scan_locking_issues",
            "Memory / Copies":          "scan_memory_issues",
            "Short-Circuit Evaluation": "scan_short_circuit_issues",
            "Write Patterns":           "scan_write_pattern_issues",
            "Cursor Safety":            "scan_cursor_safety_issues",
            "Stale Reads":              "scan_stale_read_issues",
            "Sort / Keys":              "scan_data_transfer_issues",  # covered by data transfer
        }
        for r in group_results:
            if r["total"] > 0:
                tool = group_tool_map.get(r["group"], "scan_al_workspace")
                lines.append(f"- **{r['group']}** ({r['total']} issues) → `{tool}(\"{folder_path}\")`")

    return "\n".join(lines)


if __name__ == "__main__":
    mcp.run()
'
|
|
4
|
-
|
|
5
|
-
|
|
6
|
-
|
|
1
|
+
#!/usr/bin/env python3
|
|
2
|
+
"""
|
|
3
|
+
AL Performance MCP Server
|
|
4
|
+
=========================
|
|
5
|
+
MCP server that scans AL source files for performance anti-patterns
|
|
6
|
+
and applies optimized fixes — based on the BC TechDays 2026 Workshop
|
|
7
|
+
(44 exercises covering real-world AL performance patterns).
|
|
8
|
+
|
|
9
|
+
Tools exposed:
|
|
10
|
+
scan_al_workspace — scan a folder for all performance issues
|
|
11
|
+
fix_al_file — apply all fixes to a single AL file
|
|
12
|
+
fix_al_workspace — apply all fixes to every AL file in a folder
|
|
13
|
+
list_patterns — list all known patterns with descriptions
|
|
14
|
+
explain_pattern — explain a single pattern in depth
|
|
15
|
+
|
|
16
|
+
Usage with Claude Desktop / VS Code Copilot:
|
|
17
|
+
Add to mcp.json (see mcp.json in this folder)
|
|
18
|
+
"""
|
|
19
|
+
|
|
20
|
+
import re
|
|
21
|
+
import json
|
|
22
|
+
from pathlib import Path
|
|
23
|
+
from typing import Any
|
|
24
|
+
|
|
25
|
+
from mcp.server.fastmcp import FastMCP
|
|
26
|
+
|
|
27
|
+
mcp = FastMCP("AL Performance Analyzer")
|
|
28
|
+
|
|
29
|
+
# ---------------------------------------------------------------------------
|
|
30
|
+
# Pattern registry
|
|
31
|
+
# Each entry:
|
|
32
|
+
# id — short identifier used in findings
|
|
33
|
+
# group — category of issue
|
|
34
|
+
# severity — HIGH / MEDIUM / LOW
|
|
35
|
+
# title — one-line description
|
|
36
|
+
# description — full explanation
|
|
37
|
+
# exercises — which workshop exercises cover this
|
|
38
|
+
# detector — callable(text) -> list[dict(line, snippet)]
|
|
39
|
+
# fixer — callable(text) -> str (returns fixed text)
|
|
40
|
+
# ---------------------------------------------------------------------------
|
|
41
|
+
|
|
42
|
+
PATTERNS: list[dict] = []
|
|
43
|
+
|
|
44
|
+
|
|
45
|
+
def _register(id, group, severity, title, description, exercises):
|
|
46
|
+
"""Decorator factory that registers a pattern with its detector and fixer."""
|
|
47
|
+
def decorator(cls):
|
|
48
|
+
PATTERNS.append({
|
|
49
|
+
"id": id,
|
|
50
|
+
"group": group,
|
|
51
|
+
"severity": severity,
|
|
52
|
+
"title": title,
|
|
53
|
+
"description": description,
|
|
54
|
+
"exercises": exercises,
|
|
55
|
+
"detector": cls.detect,
|
|
56
|
+
"fixer": cls.fix,
|
|
57
|
+
})
|
|
58
|
+
return cls
|
|
59
|
+
return decorator
|
|
60
|
+
|
|
61
|
+
|
|
62
|
+
def _find_line(text: str, char_offset: int) -> int:
|
|
63
|
+
return text[:char_offset].count('\n') + 1
|
|
64
|
+
|
|
65
|
+
|
|
66
|
+
def _findings(text: str, pattern: re.Pattern, message_fn=None) -> list[dict]:
|
|
67
|
+
out = []
|
|
68
|
+
for m in pattern.finditer(text):
|
|
69
|
+
line = _find_line(text, m.start())
|
|
70
|
+
snippet = m.group(0).strip()[:120]
|
|
71
|
+
out.append({"line": line, "snippet": snippet, "message": message_fn(m) if message_fn else ""})
|
|
72
|
+
return out
|
|
73
|
+
|
|
74
|
+
|
|
75
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
76
|
+
# PATTERN 01 — Missing SetLoadFields before FindSet / Find
|
|
77
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
78
|
+
@_register(
|
|
79
|
+
id="MISSING_SETLOADFIELDS",
|
|
80
|
+
group="Data Transfer",
|
|
81
|
+
severity="HIGH",
|
|
82
|
+
title="FindSet/Find without SetLoadFields",
|
|
83
|
+
description=('Customer.FindSet() without SetLoadFields generates a SELECT with ALL 100+ fields — including every table extension column joined in. On each row, the NST deserialises a massive buffer it doesn\'t need.\n\nSQL IMPACT: SELECT \\"18\\".\\"timestamp\\",\\"18\\".\\"No_\\",\\"18\\".\\"Name\\"... (all 100+ columns) + JOIN extension tables.\nWith 10 000 customers that\'s gigabytes of needlessly transferred data.\n\nBAD: if Customer.FindSet() then\nGOOD: Customer.SetLoadFields(\\"No.\\", Name, \\"Credit Limit (LCY)\\");\n if Customer.FindSet() then\n\nHINT: Look at the SELECT in SQL Profiler. Count how many columns are fetched. Then add SetLoadFields and compare.'),
|
|
84
|
+
exercises=[1, 2, 33],
|
|
85
|
+
)
|
|
86
|
+
class PatternMissingSetLoadFields:
|
|
87
|
+
# Detect: FindSet/Find on a record variable NOT immediately preceded (within 3 lines) by SetLoadFields
|
|
88
|
+
_FIND = re.compile(r'(\w+)\.(FindSet|FindFirst|FindLast|Find\()', re.MULTILINE)
|
|
89
|
+
|
|
90
|
+
@staticmethod
|
|
91
|
+
def detect(text: str) -> list[dict]:
|
|
92
|
+
findings = []
|
|
93
|
+
lines = text.splitlines()
|
|
94
|
+
for i, line in enumerate(lines):
|
|
95
|
+
m = re.search(r'(\w+)\.(FindSet|FindFirst|FindLast|Find\()', line)
|
|
96
|
+
if not m:
|
|
97
|
+
continue
|
|
98
|
+
var = m.group(1)
|
|
99
|
+
if var.lower() in ('true', 'false', 'result', 'rec'):
|
|
100
|
+
continue
|
|
101
|
+
# Check 3 lines above for SetLoadFields on same var
|
|
102
|
+
context = '\n'.join(lines[max(0, i-3):i])
|
|
103
|
+
if f'{var}.SetLoadFields' not in context and f'{var}.SetAutoCalcFields' not in context:
|
|
104
|
+
# Exclude if in a comment
|
|
105
|
+
stripped = line.strip()
|
|
106
|
+
if stripped.startswith('//'):
|
|
107
|
+
continue
|
|
108
|
+
findings.append({
|
|
109
|
+
"line": i + 1,
|
|
110
|
+
"snippet": line.strip()[:120],
|
|
111
|
+
"message": f"'{var}.{m.group(2)}' called without SetLoadFields"
|
|
112
|
+
})
|
|
113
|
+
return findings
|
|
114
|
+
|
|
115
|
+
@staticmethod
|
|
116
|
+
def fix(text: str) -> str:
|
|
117
|
+
# This pattern requires context-specific fixes (which fields to load)
|
|
118
|
+
# We annotate rather than blindly fix
|
|
119
|
+
return text
|
|
120
|
+
|
|
121
|
+
|
|
122
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
123
|
+
# PATTERN 02 — Find('-') buffer-size-1 anti-pattern
|
|
124
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
125
|
+
@_register(
|
|
126
|
+
id="FIND_DASH_BUFFER_ONE",
|
|
127
|
+
group="Data Transfer",
|
|
128
|
+
severity="HIGH",
|
|
129
|
+
title="Find('-') with buffer size 1 (use FindSet instead)",
|
|
130
|
+
description=("Find('-') pre-fetches only 1 record at a time (read buffer = 1). Each call to Next() fires a new SQL query: SELECT TOP 50 ...\nFor 1 000 entries that is 20 round-trips instead of 1 with FindSet. Find('-') also ignores any previous SetCurrentKey call.\n\nSQL IMPACT: SELECT TOP 50 ... (repeated per Next() batch)\nvs FindSet: single SELECT that pre-fetches rows efficiently.\n\nBAD: if Record.Find('-') then repeat ... until Record.Next() = 0;\nGOOD: if Record.FindSet() then repeat ... until Record.Next() = 0;\n\nHINT: Compare the number of SQL queries for Find('-') vs FindSet on 1 000 rows. Check the Reads column in Profiler."),
|
|
131
|
+
exercises=[2, 24],
|
|
132
|
+
)
|
|
133
|
+
class PatternFindDash:
|
|
134
|
+
_RE = re.compile(r"(\w+)\.Find\('-'\)", re.MULTILINE)
|
|
135
|
+
|
|
136
|
+
@staticmethod
|
|
137
|
+
def detect(text: str) -> list[dict]:
|
|
138
|
+
return _findings(text, PatternFindDash._RE,
|
|
139
|
+
lambda m: f"Use FindSet() instead of {m.group(1)}.Find('-')")
|
|
140
|
+
|
|
141
|
+
@staticmethod
|
|
142
|
+
def fix(text: str) -> str:
|
|
143
|
+
return PatternFindDash._RE.sub(lambda m: f"{m.group(1)}.FindSet()", text)
|
|
144
|
+
|
|
145
|
+
|
|
146
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
147
|
+
# PATTERN 03 — CalcFields inside a loop
|
|
148
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
149
|
+
@_register(
|
|
150
|
+
id="CALCFIELDS_IN_LOOP",
|
|
151
|
+
group="FlowFields",
|
|
152
|
+
severity="HIGH",
|
|
153
|
+
title="CalcFields inside a repeat..until loop",
|
|
154
|
+
description=('Calling CalcFields(Balance) inside a FindSet loop fires one extra SQL sub-query per iteration to compute the FlowField aggregate. For 500 vendors that is 500 extra SQL round-trips just for Balance. SetAutoCalcFields merges the FlowField into the main SELECT.\n\nSQL IMPACT: Per row: SELECT SUM(...) FROM \\"Detailed Vendor Ledg. Entry\\" ... = N additional queries inside the loop.\n\nBAD: repeat Customer.CalcFields(Balance); until Customer.Next() = 0;\nGOOD: Customer.SetAutoCalcFields(Balance);\n if Customer.FindSet() then repeat ... until Customer.Next() = 0;\n\nHINT: Count the extra SQL queries per loop iteration with CalcFields vs AutoCalcFields. Duration difference grows with record count.'),
|
|
155
|
+
exercises=[3],
|
|
156
|
+
)
|
|
157
|
+
class PatternCalcFieldsInLoop:
|
|
158
|
+
_RE = re.compile(r'^\s+\w+\.CalcFields\([^)]+\);', re.MULTILINE)
|
|
159
|
+
|
|
160
|
+
@staticmethod
|
|
161
|
+
def detect(text: str) -> list[dict]:
|
|
162
|
+
findings = []
|
|
163
|
+
lines = text.splitlines()
|
|
164
|
+
in_loop = False
|
|
165
|
+
depth = 0
|
|
166
|
+
for i, line in enumerate(lines):
|
|
167
|
+
stripped = line.strip()
|
|
168
|
+
if stripped.lower() == 'repeat':
|
|
169
|
+
in_loop = True
|
|
170
|
+
depth += 1
|
|
171
|
+
if re.match(r'until\s+\w+\.Next\(\)', stripped, re.IGNORECASE):
|
|
172
|
+
depth -= 1
|
|
173
|
+
if depth <= 0:
|
|
174
|
+
in_loop = False
|
|
175
|
+
if in_loop and re.search(r'\w+\.CalcFields\(', line):
|
|
176
|
+
if not stripped.startswith('//'):
|
|
177
|
+
findings.append({
|
|
178
|
+
"line": i + 1,
|
|
179
|
+
"snippet": line.strip()[:120],
|
|
180
|
+
"message": "CalcFields() inside loop — use SetAutoCalcFields() before FindSet()"
|
|
181
|
+
})
|
|
182
|
+
return findings
|
|
183
|
+
|
|
184
|
+
@staticmethod
|
|
185
|
+
def fix(text: str) -> str:
|
|
186
|
+
return text # Context-specific; needs the variable name
|
|
187
|
+
|
|
188
|
+
|
|
189
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
190
|
+
# PATTERN 04 — Record parameter passed by value (missing var)
|
|
191
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
192
|
+
@_register(
|
|
193
|
+
id="RECORD_BY_VALUE",
|
|
194
|
+
group="Memory / Copies",
|
|
195
|
+
severity="MEDIUM",
|
|
196
|
+
title="Record parameter passed by value instead of var",
|
|
197
|
+
description=('Without VAR, AL copies the entire Record instance into a new memory block: all field values, filter state, cursor position. Large records (Customer, Item) copied on every call. With many nested calls this causes significant GC pressure on NST.\n\nSQL IMPACT: No SQL change — overhead is in NST memory allocation & copy.\n\nBAD: local procedure Foo(Customer: Record Customer)\nGOOD: local procedure Foo(var Customer: Record Customer)\n\nHINT: No SQL difference — measure NST throughput and allocation counters.'),
|
|
198
|
+
exercises=[4],
|
|
199
|
+
)
|
|
200
|
+
class PatternRecordByValue:
|
|
201
|
+
_RE = re.compile(
|
|
202
|
+
r'(local\s+procedure|procedure)\s+\w+\((?:[^)]*,\s*)?(\w+):\s*Record\s+[^;)]+\)',
|
|
203
|
+
re.MULTILINE
|
|
204
|
+
)
|
|
205
|
+
|
|
206
|
+
@staticmethod
|
|
207
|
+
def detect(text: str) -> list[dict]:
|
|
208
|
+
findings = []
|
|
209
|
+
for m in PatternRecordByValue._RE.finditer(text):
|
|
210
|
+
line_text = text[max(0, m.start()-200):m.end()]
|
|
211
|
+
if '(var ' in m.group(0) or re.search(r'\bvar\s+\w+:\s*Record', m.group(0)):
|
|
212
|
+
continue
|
|
213
|
+
if m.group(2) == 'var':
|
|
214
|
+
continue
|
|
215
|
+
line = _find_line(text, m.start())
|
|
216
|
+
findings.append({
|
|
217
|
+
"line": line,
|
|
218
|
+
"snippet": m.group(0)[:120],
|
|
219
|
+
"message": "Record parameter without 'var' — creates a full copy on each call"
|
|
220
|
+
})
|
|
221
|
+
return findings
|
|
222
|
+
|
|
223
|
+
@staticmethod
|
|
224
|
+
def fix(text: str) -> str:
|
|
225
|
+
return text
|
|
226
|
+
|
|
227
|
+
|
|
228
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
229
|
+
# PATTERN 05 — Loop sum instead of CalcSums
|
|
230
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
231
|
+
@_register(
|
|
232
|
+
id="LOOP_SUM_VS_CALCSUMS",
|
|
233
|
+
group="Aggregation",
|
|
234
|
+
severity="HIGH",
|
|
235
|
+
title="Manual summation loop instead of CalcSums",
|
|
236
|
+
description=('Summing a field by iterating all rows in AL: fetches every row from SQL, deserialises it in NST, accumulates in a local variable. CalcSums(Amount) translates to a SQL SUM() aggregate — computed at the database, returns a single row.\n\nSQL IMPACT: Manual loop: SELECT all rows, process N rows in NST\nCalcSums: SELECT SUM(\\"Amount\\") ... — returns 1 row.\n\nBAD: repeat Total += Record.Amount; until Record.Next() = 0;\nGOOD: Record.CalcSums(Amount); Total := Record.Amount;\n\nHINT: CalcSums result: 1 SQL row returned. Loop result: N SQL rows fetched and summed. Check Reads: CalcSums = 1, loop = N.'),
|
|
237
|
+
exercises=[5],
|
|
238
|
+
)
|
|
239
|
+
class PatternLoopSum:
|
|
240
|
+
_RE = re.compile(r'(\w+)\s*\+=\s*\w+\.\w+;', re.MULTILINE)
|
|
241
|
+
|
|
242
|
+
@staticmethod
|
|
243
|
+
def detect(text: str) -> list[dict]:
|
|
244
|
+
findings = []
|
|
245
|
+
lines = text.splitlines()
|
|
246
|
+
in_loop = False
|
|
247
|
+
for i, line in enumerate(lines):
|
|
248
|
+
stripped = line.strip()
|
|
249
|
+
if stripped.lower() == 'repeat':
|
|
250
|
+
in_loop = True
|
|
251
|
+
if re.match(r'until\s+\w+\.Next\(\)', stripped, re.IGNORECASE):
|
|
252
|
+
in_loop = False
|
|
253
|
+
if in_loop and PatternLoopSum._RE.search(line) and not stripped.startswith('//'):
|
|
254
|
+
findings.append({
|
|
255
|
+
"line": i + 1,
|
|
256
|
+
"snippet": line.strip()[:120],
|
|
257
|
+
"message": "Manual += accumulation in loop — consider CalcSums() if summing a single field"
|
|
258
|
+
})
|
|
259
|
+
return findings
|
|
260
|
+
|
|
261
|
+
@staticmethod
|
|
262
|
+
def fix(text: str) -> str:
|
|
263
|
+
return text
|
|
264
|
+
|
|
265
|
+
|
|
266
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
267
|
+
# PATTERN 06 — String concatenation += in loop (use TextBuilder)
|
|
268
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
269
|
+
@_register(
|
|
270
|
+
id="STRING_CONCAT_IN_LOOP",
|
|
271
|
+
group="Memory / Copies",
|
|
272
|
+
severity="HIGH",
|
|
273
|
+
title="Text += string concatenation in loop (O(n²)) — use TextBuilder",
|
|
274
|
+
description=("AL's Text type is a value type. Each += creates a brand-new string object in NST memory — old strings become GC garbage immediately. For N iterations: O(N²) memory allocations and copies. TextBuilder wraps .NET StringBuilder: O(N) time, no intermediate copies.\n\nSQL IMPACT: No SQL impact — pure NST memory pressure & GC overhead.\n\nBAD: CsvContent += BuildDetailLine(...);\nGOOD: var Builder: TextBuilder;\n Builder.Append(BuildDetailLine(...));\n Result := Builder.ToText(); // Single allocation at end\n\nHINT: The GC pressure is invisible in SQL Profiler but shows up in NST memory counters."),
|
|
275
|
+
exercises=[6],
|
|
276
|
+
)
|
|
277
|
+
class PatternStringConcatInLoop:
|
|
278
|
+
_RE = re.compile(r'(\w+)\s*\+=\s*(?![\d.])', re.MULTILINE)
|
|
279
|
+
|
|
280
|
+
@staticmethod
|
|
281
|
+
def detect(text: str) -> list[dict]:
|
|
282
|
+
findings = []
|
|
283
|
+
lines = text.splitlines()
|
|
284
|
+
in_loop = False
|
|
285
|
+
for i, line in enumerate(lines):
|
|
286
|
+
stripped = line.strip()
|
|
287
|
+
if stripped.lower() == 'repeat' or re.search(r'\bforeach\b', stripped, re.IGNORECASE):
|
|
288
|
+
in_loop = True
|
|
289
|
+
if re.match(r'until\s+\w+\.Next\(\)', stripped, re.IGNORECASE) or stripped == 'end;':
|
|
290
|
+
in_loop = False
|
|
291
|
+
if in_loop:
|
|
292
|
+
m = PatternStringConcatInLoop._RE.search(line)
|
|
293
|
+
if m and not stripped.startswith('//'):
|
|
294
|
+
var = m.group(1)
|
|
295
|
+
# Look back to see if it's declared as Text
|
|
296
|
+
context = '\n'.join(lines[max(0, i-30):i])
|
|
297
|
+
if re.search(rf'\b{re.escape(var)}\s*:\s*Text\b', context):
|
|
298
|
+
findings.append({
|
|
299
|
+
"line": i + 1,
|
|
300
|
+
"snippet": line.strip()[:120],
|
|
301
|
+
"message": f"Text += in loop creates O(n²) allocations — use TextBuilder"
|
|
302
|
+
})
|
|
303
|
+
return findings
|
|
304
|
+
|
|
305
|
+
@staticmethod
|
|
306
|
+
def fix(text: str) -> str:
|
|
307
|
+
return text
|
|
308
|
+
|
|
309
|
+
|
|
310
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
311
|
+
# PATTERN 07 — FindSet without (true) when modifying via cursor
|
|
312
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
313
|
+
@_register(
|
|
314
|
+
id="FINDSET_MODIFY_NO_TRUE",
|
|
315
|
+
group="Locking",
|
|
316
|
+
severity="MEDIUM",
|
|
317
|
+
title="FindSet() without (true) when Modify is called on cursor variable",
|
|
318
|
+
description=('FindSet uses ReadUncommitted isolation and pre-fetches rows in batches. Calling Modify inside the loop body can invalidate the cursor position. Records may be visited twice, skipped entirely, or cause deadlocks. The cursor is not designed to survive concurrent DML on the same rows.\n\nSQL IMPACT: SELECT TOP 50 ... (ReadUncommitted) then UPDATE inside — cursor instability.\n\nBAD: if Record.FindSet() then repeat Record.Field := ...; Record.Modify(); ...\nGOOD: if Record.FindSet(true) then repeat Record.Field := ...; Record.Modify(); ...\n\nHINT: Use SQL Profiler to watch which records get updated. Run the anti-pattern twice — some records may be updated twice or skipped.'),
|
|
319
|
+
exercises=[7],
|
|
320
|
+
)
|
|
321
|
+
class PatternFindSetNoForUpdate:
|
|
322
|
+
_RE = re.compile(r'(\w+)\.FindSet\(\)', re.MULTILINE)
|
|
323
|
+
|
|
324
|
+
@staticmethod
|
|
325
|
+
def detect(text: str) -> list[dict]:
|
|
326
|
+
findings = []
|
|
327
|
+
lines = text.splitlines()
|
|
328
|
+
for i, line in enumerate(lines):
|
|
329
|
+
m = PatternFindSetNoForUpdate._RE.search(line)
|
|
330
|
+
if not m or line.strip().startswith('//'):
|
|
331
|
+
continue
|
|
332
|
+
var = m.group(1)
|
|
333
|
+
# Look ahead for Modify on the same var
|
|
334
|
+
ahead = '\n'.join(lines[i:min(len(lines), i+15)])
|
|
335
|
+
if re.search(rf'\b{re.escape(var)}\.Modify\(', ahead):
|
|
336
|
+
findings.append({
|
|
337
|
+
"line": i + 1,
|
|
338
|
+
"snippet": line.strip()[:120],
|
|
339
|
+
"message": f"'{var}.FindSet()' but '{var}.Modify()' found in loop — use FindSet(true)"
|
|
340
|
+
})
|
|
341
|
+
return findings
|
|
342
|
+
|
|
343
|
+
@staticmethod
|
|
344
|
+
def fix(text: str) -> str:
|
|
345
|
+
# Only fix when Modify follows in same loop — conservative approach
|
|
346
|
+
def replace_if_modify_follows(m):
|
|
347
|
+
pos = m.end()
|
|
348
|
+
ahead = text[pos:pos+500]
|
|
349
|
+
var = m.group(1)
|
|
350
|
+
if re.search(rf'\b{re.escape(var)}\.Modify\(', ahead):
|
|
351
|
+
return f"{var}.FindSet(true)"
|
|
352
|
+
return m.group(0)
|
|
353
|
+
return re.sub(r'(\w+)\.FindSet\(\)', replace_if_modify_follows, text)
|
|
354
|
+
|
|
355
|
+
|
|
356
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
357
|
+
# PATTERN 08 — Delete inside a loop (use DeleteAll)
|
|
358
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
359
|
+
@_register(
|
|
360
|
+
id="DELETE_IN_LOOP",
|
|
361
|
+
group="Bulk Operations",
|
|
362
|
+
severity="HIGH",
|
|
363
|
+
title="Record.Delete() inside a loop — use DeleteAll()",
|
|
364
|
+
description=('Same cursor instability as Modify — Delete during FindSet can cause the read cursor to skip or revisit records. DeleteAll is atomic and uses a single DELETE FROM statement. If selective deletion is needed, collect keys first, delete after loop.\n\nSQL IMPACT: SELECT TOP 50 (cursor) + DELETE per row — cursor corruption risk.\nDeleteAll: 1 DELETE FROM statement vs N individual DELETEs.\n\nBAD: if Record.FindSet() then repeat Record.Delete(); until Record.Next() = 0;\nGOOD: Record.SetRange(Active, false); Record.DeleteAll(false);\n\nHINT: Compare the number of DELETE statements in Profiler: DeleteAll = 1 SQL DELETE; loop = N DELETEs.'),
|
|
365
|
+
exercises=[8],
|
|
366
|
+
)
|
|
367
|
+
class PatternDeleteInLoop:
|
|
368
|
+
@staticmethod
|
|
369
|
+
def detect(text: str) -> list[dict]:
|
|
370
|
+
findings = []
|
|
371
|
+
lines = text.splitlines()
|
|
372
|
+
in_loop = False
|
|
373
|
+
loop_var = None
|
|
374
|
+
for i, line in enumerate(lines):
|
|
375
|
+
stripped = line.strip()
|
|
376
|
+
m = re.search(r'(\w+)\.FindSet', line)
|
|
377
|
+
if m and not stripped.startswith('//'):
|
|
378
|
+
in_loop = True
|
|
379
|
+
loop_var = m.group(1)
|
|
380
|
+
if in_loop and loop_var and re.search(rf'\b{re.escape(loop_var)}\.Delete\(', line):
|
|
381
|
+
if not stripped.startswith('//'):
|
|
382
|
+
findings.append({
|
|
383
|
+
"line": i + 1,
|
|
384
|
+
"snippet": line.strip()[:120],
|
|
385
|
+
"message": f"'{loop_var}.Delete()' inside FindSet loop — use '{loop_var}.DeleteAll(false)'"
|
|
386
|
+
})
|
|
387
|
+
if re.match(r'until\s+\w+\.Next\(\)', stripped, re.IGNORECASE):
|
|
388
|
+
in_loop = False
|
|
389
|
+
loop_var = None
|
|
390
|
+
return findings
|
|
391
|
+
|
|
392
|
+
@staticmethod
|
|
393
|
+
def fix(text: str) -> str:
|
|
394
|
+
return text
|
|
395
|
+
|
|
396
|
+
|
|
397
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
398
|
+
# PATTERN 09 — Count() <> 0 instead of not IsEmpty()
|
|
399
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
400
|
+
@_register(
|
|
401
|
+
id="COUNT_NOT_ZERO",
|
|
402
|
+
group="Existence Checks",
|
|
403
|
+
severity="MEDIUM",
|
|
404
|
+
title="Count() <> 0 / Count() > 0 — use IsEmpty() instead",
|
|
405
|
+
description=('Count() generates SELECT COUNT(*) — the database must count ALL matching rows before returning. On large tables this is expensive. IsEmpty() generates IF EXISTS (SELECT TOP 1 NULL ...) — stops at the first match. O(1) vs O(N).\n\nSQL IMPACT: Count(): SELECT COUNT(*) FROM ... → scans entire table\nIsEmpty(): IF EXISTS (SELECT TOP 1 NULL FROM ...) → stops immediately.\n\nBAD: exit(Record.Count() <> 0);\nGOOD: exit(not Record.IsEmpty());\n\nHINT: Compare SQL Profiler output for both. Count() always reads all rows first. IsEmpty stops at the very first match.'),
|
|
406
|
+
exercises=[9, 10, 11],
|
|
407
|
+
)
|
|
408
|
+
class PatternCountNotZero:
|
|
409
|
+
_RE = re.compile(r'(\w+)\.Count\(\)\s*(?:<>|>|=)\s*0', re.MULTILINE)
|
|
410
|
+
|
|
411
|
+
@staticmethod
|
|
412
|
+
def detect(text: str) -> list[dict]:
|
|
413
|
+
return _findings(text, PatternCountNotZero._RE,
|
|
414
|
+
lambda m: f"'{m.group(1)}.Count() != 0' — use IsEmpty() for O(1) existence check")
|
|
415
|
+
|
|
416
|
+
@staticmethod
|
|
417
|
+
def fix(text: str) -> str:
|
|
418
|
+
def replace(m):
|
|
419
|
+
var = m.group(1)
|
|
420
|
+
op = m.group(0).split('Count()')[1].strip().split(' ')[0]
|
|
421
|
+
if op in ('<>', '>'):
|
|
422
|
+
return f'not {var}.IsEmpty()'
|
|
423
|
+
if op == '=':
|
|
424
|
+
return f'{var}.IsEmpty()'
|
|
425
|
+
return m.group(0)
|
|
426
|
+
return PatternCountNotZero._RE.sub(replace, text)
|
|
427
|
+
|
|
428
|
+
|
|
429
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
430
|
+
# PATTERN 10 — Redundant IsEmpty before FindSet (double scan)
|
|
431
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
432
|
+
@_register(
|
|
433
|
+
id="ISEMPTY_BEFORE_FINDSET",
|
|
434
|
+
group="Existence Checks",
|
|
435
|
+
severity="MEDIUM",
|
|
436
|
+
title="Redundant IsEmpty() before FindSet() (two SQL scans instead of one)",
|
|
437
|
+
description=('Checking IsEmpty() immediately before FindSet fires TWO SQL queries: 1) IF EXISTS (SELECT TOP 1 NULL ...) — the IsEmpty check; 2) SELECT TOP 50 ... — the FindSet. FindSet already returns false when no rows match — the IsEmpty is waste.\n\nSQL IMPACT: Query 1: IF EXISTS (SELECT TOP 1 NULL ...). Query 2: SELECT TOP 50 ... → redundant.\n\nBAD: if not Record.IsEmpty() then\n if Record.FindSet() then ...\nGOOD: if Record.FindSet() then ...\n\nHINT: Count the SQL queries in Profiler: IsEmpty + FindSet = 2; just FindSet = 1. The IsEmpty result is ignored by FindSet anyway.'),
|
|
438
|
+
exercises=[11],
|
|
439
|
+
)
|
|
440
|
+
class PatternIsEmptyBeforeFindSet:
|
|
441
|
+
@staticmethod
|
|
442
|
+
def detect(text: str) -> list[dict]:
|
|
443
|
+
findings = []
|
|
444
|
+
lines = text.splitlines()
|
|
445
|
+
for i, line in enumerate(lines):
|
|
446
|
+
if re.search(r'not\s+\w+\.IsEmpty\(\)', line) and not line.strip().startswith('//'):
|
|
447
|
+
# Check next 2 lines for FindSet
|
|
448
|
+
ahead = '\n'.join(lines[i:min(len(lines), i+3)])
|
|
449
|
+
if re.search(r'\.FindSet\(', ahead):
|
|
450
|
+
findings.append({
|
|
451
|
+
"line": i + 1,
|
|
452
|
+
"snippet": line.strip()[:120],
|
|
453
|
+
"message": "Redundant IsEmpty() guard before FindSet() — FindSet() returns false when empty"
|
|
454
|
+
})
|
|
455
|
+
return findings
|
|
456
|
+
|
|
457
|
+
@staticmethod
|
|
458
|
+
def fix(text: str) -> str:
|
|
459
|
+
return re.sub(
|
|
460
|
+
r'[ \t]+if not (\w+)\.IsEmpty\(\) then\s*\n([ \t]+)if \1\.FindSet\(',
|
|
461
|
+
r'\2if \1.FindSet(',
|
|
462
|
+
text
|
|
463
|
+
)
|
|
464
|
+
|
|
465
|
+
|
|
466
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
467
|
+
# PATTERN 11 — Missing 'temporary' keyword on temp table variable
|
|
468
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
469
|
+
@_register(
|
|
470
|
+
id="MISSING_TEMPORARY",
|
|
471
|
+
group="Memory / Copies",
|
|
472
|
+
severity="HIGH",
|
|
473
|
+
title="Temp table variable missing 'temporary' keyword",
|
|
474
|
+
description=('A non-temporary record sends every Insert/Get/Delete to SQL Server. Using a regular table as an in-memory scratchpad causes unnecessary SQL round-trips, transaction log writes, and lock contention. Declaring the variable \'temporary\' keeps all operations in NST memory.\n\nSQL IMPACT: Without temporary: INSERT INTO / SELECT / DELETE — full SQL for each op.\nWith temporary: All operations in NST memory — zero SQL round-trips.\n\nBAD: TempData: Record \\"Workshop Data\\";\nGOOD: TempData: Record \\"Workshop Data\\" temporary;\n\nHINT: Insert 1 000 rows with and without \'temporary\'. Without: watch 1 000 INSERTs in SQL Profiler. With temporary: zero SQL activity.'),
|
|
475
|
+
exercises=[12],
|
|
476
|
+
)
|
|
477
|
+
class PatternMissingTemporary:
|
|
478
|
+
@staticmethod
|
|
479
|
+
def detect(text: str) -> list[dict]:
|
|
480
|
+
findings = []
|
|
481
|
+
lines = text.splitlines()
|
|
482
|
+
for i, line in enumerate(lines):
|
|
483
|
+
# Variable declared with Temp prefix but no 'temporary' keyword
|
|
484
|
+
if re.search(r'\bTemp\w+\s*:\s*Record\s+', line) and 'temporary' not in line and not line.strip().startswith('//'):
|
|
485
|
+
findings.append({
|
|
486
|
+
"line": i + 1,
|
|
487
|
+
"snippet": line.strip()[:120],
|
|
488
|
+
"message": "Variable with 'Temp' prefix is missing 'temporary' keyword"
|
|
489
|
+
})
|
|
490
|
+
return findings
|
|
491
|
+
|
|
492
|
+
@staticmethod
|
|
493
|
+
def fix(text: str) -> str:
|
|
494
|
+
return re.sub(
|
|
495
|
+
r'(Temp\w+\s*:\s*Record\s+[^;]+);(?!\s*//.*temporary)',
|
|
496
|
+
lambda m: m.group(0).rstrip(';') + ' temporary;' if 'temporary' not in m.group(0) else m.group(0),
|
|
497
|
+
text
|
|
498
|
+
)
|
|
499
|
+
|
|
500
|
+
|
|
501
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
502
|
+
# PATTERN 12 — Temp table used as Dictionary (use Dictionary type)
|
|
503
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
504
|
+
@_register(
|
|
505
|
+
id="TEMP_TABLE_AS_DICT",
|
|
506
|
+
group="Memory / Copies",
|
|
507
|
+
severity="MEDIUM",
|
|
508
|
+
title="Temp Record table used as a key-value lookup (use Dictionary instead)",
|
|
509
|
+
description=("Even a 'temporary' table carries record-layer overhead: key indexes, transaction state tracking, schema validation on every operation. For simple key→value mapping (e.g. CustomerNo → SalespersonCode), the built-in Dictionary of [K, V] type has zero DB overhead.\n\nSQL IMPACT: Temp table: key index maintenance, record struct overhead per entry.\nDictionary: direct hash map lookup — O(1) Get/Set, no record overhead.\n\nBAD: TempCustomer: Record Customer temporary; TempCustomer.Insert(); TempCustomer.Get(...);\nGOOD: RoutingMap: Dictionary of [Code[20], Code[20]];\n RoutingMap.Set(..., ...); if RoutingMap.ContainsKey(...) then ...\n\nHINT: Compare Get/Set operations on temp table vs Dictionary. Measure time for 10 000 lookups each way."),
|
|
510
|
+
exercises=[13],
|
|
511
|
+
)
|
|
512
|
+
class PatternTempTableAsDict:
|
|
513
|
+
@staticmethod
|
|
514
|
+
def detect(text: str) -> list[dict]:
|
|
515
|
+
findings = []
|
|
516
|
+
lines = text.splitlines()
|
|
517
|
+
for i, line in enumerate(lines):
|
|
518
|
+
m = re.search(r'(Temp\w+)\s*:\s*Record\s+\S+\s+temporary', line)
|
|
519
|
+
if not m:
|
|
520
|
+
continue
|
|
521
|
+
var = m.group(1)
|
|
522
|
+
# Look ahead for both Insert and Get on same var — classic dict pattern
|
|
523
|
+
rest = '\n'.join(lines[i:min(len(lines), i+60)])
|
|
524
|
+
if re.search(rf'\b{re.escape(var)}\.Insert\(', rest) and re.search(rf'\b{re.escape(var)}\.Get\(', rest):
|
|
525
|
+
findings.append({
|
|
526
|
+
"line": i + 1,
|
|
527
|
+
"snippet": line.strip()[:120],
|
|
528
|
+
"message": f"'{var}' used as key-value store (Insert+Get pattern) — prefer Dictionary of [...]"
|
|
529
|
+
})
|
|
530
|
+
return findings
|
|
531
|
+
|
|
532
|
+
@staticmethod
|
|
533
|
+
def fix(text: str) -> str:
|
|
534
|
+
return text
|
|
535
|
+
|
|
536
|
+
|
|
537
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
538
|
+
# PATTERN 13 — FindFirst() used for loop iteration
|
|
539
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
540
|
+
@_register(
|
|
541
|
+
id="FINDFIRST_IN_LOOP",
|
|
542
|
+
group="Data Transfer",
|
|
543
|
+
severity="HIGH",
|
|
544
|
+
title="FindFirst() used for multi-row iteration (buffer size 1)",
|
|
545
|
+
description=('FindFirst() generates SELECT TOP 1 — fetches exactly one record. When used to start a loop (calling Next() repeatedly), every Next() call that exhausts the buffer fires a new SELECT TOP 50. FindSet() pre-fetches 50 rows immediately — far fewer SQL queries.\n\nSQL IMPACT: FindFirst: SELECT TOP 1 ... then SELECT TOP 50 per batch in Next().\nFindSet: Single SELECT that establishes the full read cursor.\n\nBAD: if Record.FindFirst() then repeat ... until Record.Next() = 0;\nGOOD: if Record.FindSet() then repeat ... until Record.Next() = 0;\n\nHINT: Trace SQL queries for a 500-row loop with FindFirst. FindFirst fires SELECT TOP 1 first, then Next batches. FindSet fires one SELECT and handles batching internally.'),
|
|
546
|
+
exercises=[14],
|
|
547
|
+
)
|
|
548
|
+
class PatternFindFirstInLoop:
|
|
549
|
+
@staticmethod
|
|
550
|
+
def detect(text: str) -> list[dict]:
|
|
551
|
+
findings = []
|
|
552
|
+
lines = text.splitlines()
|
|
553
|
+
for i, line in enumerate(lines):
|
|
554
|
+
m = re.search(r'(\w+)\.FindFirst\(\)', line)
|
|
555
|
+
if not m or line.strip().startswith('//'):
|
|
556
|
+
continue
|
|
557
|
+
var = m.group(1)
|
|
558
|
+
# Look ahead for Next() on same var
|
|
559
|
+
ahead = '\n'.join(lines[i:min(len(lines), i+20)])
|
|
560
|
+
if re.search(rf'\b{re.escape(var)}\.Next\(\)', ahead):
|
|
561
|
+
findings.append({
|
|
562
|
+
"line": i + 1,
|
|
563
|
+
"snippet": line.strip()[:120],
|
|
564
|
+
"message": f"'{var}.FindFirst()' followed by Next() — use FindSet() for multi-row iteration"
|
|
565
|
+
})
|
|
566
|
+
return findings
|
|
567
|
+
|
|
568
|
+
@staticmethod
|
|
569
|
+
def fix(text: str) -> str:
|
|
570
|
+
def replace(m):
|
|
571
|
+
var = m.group(1)
|
|
572
|
+
pos = m.end()
|
|
573
|
+
ahead = text[pos:pos+300]
|
|
574
|
+
if re.search(rf'\b{re.escape(var)}\.Next\(\)', ahead):
|
|
575
|
+
return f"{var}.FindSet()"
|
|
576
|
+
return m.group(0)
|
|
577
|
+
return re.sub(r'(\w+)\.FindFirst\(\)', replace, text)
|
|
578
|
+
|
|
579
|
+
|
|
580
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
581
|
+
# PATTERN 14 — FindSet guard before ModifyAll (unnecessary)
|
|
582
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
583
|
+
@_register(
|
|
584
|
+
id="FINDSET_BEFORE_MODIFYALL",
|
|
585
|
+
group="Bulk Operations",
|
|
586
|
+
severity="MEDIUM",
|
|
587
|
+
title="FindSet() guard before ModifyAll() — unnecessary (double scan)",
|
|
588
|
+
description=('Calling FindSet() immediately before ModifyAll() fires an extra SELECT just to confirm rows exist. ModifyAll() already handles empty result sets gracefully — it does nothing if no rows match the current filters. The FindSet is pure overhead with zero functional benefit.\n\nSQL IMPACT: Extra query: SELECT TOP 50 ... (only to check existence).\nThen: UPDATE ... WHERE ... (ModifyAll — does this anyway).\nWith FindSet: 2 queries (SELECT + UPDATE). Without: 1 query (UPDATE only).\n\nBAD: if Record.FindSet() then Record.ModifyAll(...);\nGOOD: Record.ModifyAll(...);\n\nHINT: Look at SQL before ModifyAll with and without FindSet. With FindSet: 2 queries. Without: 1 query.'),
|
|
589
|
+
exercises=[15],
|
|
590
|
+
)
|
|
591
|
+
class PatternFindSetBeforeModifyAll:
|
|
592
|
+
_RE = re.compile(r'if\s+(\w+)\.FindSet\(\)\s+then\s+\n?\s+\1\.ModifyAll\(', re.MULTILINE)
|
|
593
|
+
|
|
594
|
+
@staticmethod
|
|
595
|
+
def detect(text: str) -> list[dict]:
|
|
596
|
+
return _findings(text, PatternFindSetBeforeModifyAll._RE,
|
|
597
|
+
lambda m: f"FindSet() guard before ModifyAll() on '{m.group(1)}' is redundant")
|
|
598
|
+
|
|
599
|
+
@staticmethod
|
|
600
|
+
def fix(text: str) -> str:
|
|
601
|
+
return re.sub(
|
|
602
|
+
r'if\s+(\w+)\.FindSet\(\)\s+then\s*\n(\s+)\1\.ModifyAll\(',
|
|
603
|
+
r'\2\1.ModifyAll(',
|
|
604
|
+
text
|
|
605
|
+
)
|
|
606
|
+
|
|
607
|
+
|
|
608
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
609
|
+
# PATTERN 15 — SetFilter on FlowField (use SetAutoCalcFields + AL filter)
|
|
610
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
611
|
+
@_register(
|
|
612
|
+
id="SETFILTER_ON_FLOWFIELD",
|
|
613
|
+
group="FlowFields",
|
|
614
|
+
severity="HIGH",
|
|
615
|
+
title="SetFilter on FlowField causes correlated subquery per row",
|
|
616
|
+
description=("SetFilter on a FlowField (e.g. Balance, which is a CalcField) cannot be pushed to the SQL WHERE clause — it has no physical column. BC must fetch ALL rows matching the other filters, then compute the FlowField for each row individually and filter in AL. Full table scan.\n\nSQL IMPACT: SELECT all rows ... then per row: SELECT SUM(...) for FlowField.\nSQL cannot filter on a computed value it hasn't calculated yet.\n\nBAD: Customer.SetFilter(Balance, '>%1', 0); if Customer.FindSet() then ...\nGOOD: Customer.SetAutoCalcFields(Balance);\n if Customer.FindSet() then repeat if Customer.Balance > 0 then ...\n\nHINT: Try SetFilter(Balance, '>1000') — check the SQL WHERE. Balance won't appear in WHERE — all rows fetched. Compare with filtering on a normal indexed decimal field."),
|
|
617
|
+
exercises=[16],
|
|
618
|
+
)
|
|
619
|
+
class PatternSetFilterOnFlowField:
|
|
620
|
+
# Common FlowFields in BC
|
|
621
|
+
_FLOWFIELDS = {'Balance', 'Balance (LCY)', 'Sales (LCY)', 'Purchases (LCY)',
|
|
622
|
+
'Outstanding Orders', 'Outstanding Invoices', 'Net Change'}
|
|
623
|
+
_RE = re.compile(r'(\w+)\.SetFilter\(([^,)]+),', re.MULTILINE)
|
|
624
|
+
|
|
625
|
+
@staticmethod
|
|
626
|
+
def detect(text: str) -> list[dict]:
|
|
627
|
+
findings = []
|
|
628
|
+
for m in PatternSetFilterOnFlowField._RE.finditer(text):
|
|
629
|
+
field = m.group(2).strip().strip('"')
|
|
630
|
+
if field in PatternSetFilterOnFlowField._FLOWFIELDS:
|
|
631
|
+
line = _find_line(text, m.start())
|
|
632
|
+
findings.append({
|
|
633
|
+
"line": line,
|
|
634
|
+
"snippet": m.group(0)[:120],
|
|
635
|
+
"message": f"SetFilter on FlowField '{field}' — use SetAutoCalcFields + AL-side filter"
|
|
636
|
+
})
|
|
637
|
+
return findings
|
|
638
|
+
|
|
639
|
+
@staticmethod
|
|
640
|
+
def fix(text: str) -> str:
|
|
641
|
+
return text
|
|
642
|
+
|
|
643
|
+
|
|
644
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
645
|
+
# PATTERN 16 — OR / AND both sides always evaluated (use nested IF)
|
|
646
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
647
|
+
@_register(
|
|
648
|
+
id="EAGER_EVALUATION_OR_AND",
|
|
649
|
+
group="Short-Circuit Evaluation",
|
|
650
|
+
severity="MEDIUM",
|
|
651
|
+
title="AL 'or'/'and' evaluates both sides eagerly — use nested IF for expensive calls",
|
|
652
|
+
description=('AL evaluates BOTH sides of OR/AND regardless of the left side result. If the left condition calls an expensive function (FindSet, CalcFields), the right side still runs even when left already determines the result. Nested IF statements provide proper short-circuit behavior.\n\nSQL IMPACT: No SQL change — both function calls execute unconditionally.\nWith nested IF: expensive right-side call skipped when left is true/false.\n\nBAD: if ExpensiveA() or ExpensiveB() then\nGOOD: if ExpensiveA() then ProcessResult()\n else if ExpensiveB() then ProcessResult();\n\nHINT: Add trace messages inside each expensive function. Count how many times each is called with OR vs nested IF. Right-side function should not run when left is true.'),
|
|
653
|
+
exercises=[17, 18, 39],
|
|
654
|
+
)
|
|
655
|
+
class PatternEagerEvaluation:
|
|
656
|
+
# Heuristic: function calls as operands of or/and
|
|
657
|
+
_RE = re.compile(r'\b(\w+\([^)]*\))\s+(or|and)\s+(\w+\([^)]*\))', re.MULTILINE | re.IGNORECASE)
|
|
658
|
+
|
|
659
|
+
@staticmethod
|
|
660
|
+
def detect(text: str) -> list[dict]:
|
|
661
|
+
findings = []
|
|
662
|
+
for m in PatternEagerEvaluation._RE.finditer(text):
|
|
663
|
+
if text[max(0, m.start()-2):m.start()].strip().startswith('//'):
|
|
664
|
+
continue
|
|
665
|
+
line = _find_line(text, m.start())
|
|
666
|
+
line_text = text.splitlines()[line-1].strip()
|
|
667
|
+
if line_text.startswith('//'):
|
|
668
|
+
continue
|
|
669
|
+
findings.append({
|
|
670
|
+
"line": line,
|
|
671
|
+
"snippet": m.group(0)[:120],
|
|
672
|
+
"message": f"Eager evaluation: '{m.group(2).upper()}' always evaluates both sides — use nested IF or 'case true of'"
|
|
673
|
+
})
|
|
674
|
+
return findings
|
|
675
|
+
|
|
676
|
+
@staticmethod
|
|
677
|
+
def fix(text: str) -> str:
|
|
678
|
+
return text # Requires understanding of intent
|
|
679
|
+
|
|
680
|
+
|
|
681
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
682
|
+
# PATTERN 17 — SetRange/filter mutation inside FindSet loop
|
|
683
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
684
|
+
@_register(
|
|
685
|
+
id="FILTER_MUTATION_IN_LOOP",
|
|
686
|
+
group="Cursor Safety",
|
|
687
|
+
severity="HIGH",
|
|
688
|
+
title="SetRange/SetFilter inside FindSet loop corrupts cursor",
|
|
689
|
+
description=("Setting a new filter inside a FindSet loop modifies the record variable's filter state. Next() continues on the OLD cursor, not the new filter. Result: records may be missed, wrong data returned, or infinite loop. The cursor position becomes undefined after a SetRange mid-loop.\n\nSQL IMPACT: Cursor established by FindSet, then filter changed → Next() undefined behavior. Hard to reproduce bugs.\n\nBAD: if Rec.FindSet() then repeat Rec.SetRange(Field, Rec.Field); until Rec.Next()=0;\nGOOD: Collect keys into a List first, then process with Get().\n\nHINT: Set a breakpoint inside the loop after SetRange. Watch which records Next() returns after the filter change."),
|
|
690
|
+
exercises=[19],
|
|
691
|
+
)
|
|
692
|
+
class PatternFilterMutationInLoop:
|
|
693
|
+
@staticmethod
|
|
694
|
+
def detect(text: str) -> list[dict]:
|
|
695
|
+
findings = []
|
|
696
|
+
lines = text.splitlines()
|
|
697
|
+
in_loop = False
|
|
698
|
+
loop_var = None
|
|
699
|
+
for i, line in enumerate(lines):
|
|
700
|
+
m = re.search(r'(\w+)\.FindSet', line)
|
|
701
|
+
if m and not line.strip().startswith('//'):
|
|
702
|
+
in_loop = True
|
|
703
|
+
loop_var = m.group(1)
|
|
704
|
+
if in_loop and loop_var:
|
|
705
|
+
if re.search(rf'\b{re.escape(loop_var)}\.(SetRange|SetFilter)\(', line) and not line.strip().startswith('//'):
|
|
706
|
+
findings.append({
|
|
707
|
+
"line": i + 1,
|
|
708
|
+
"snippet": line.strip()[:120],
|
|
709
|
+
"message": f"'{loop_var}.SetRange/SetFilter' inside FindSet loop — corrupts cursor"
|
|
710
|
+
})
|
|
711
|
+
if re.match(r'until\s+\w+\.Next\(\)', line.strip(), re.IGNORECASE):
|
|
712
|
+
in_loop = False
|
|
713
|
+
loop_var = None
|
|
714
|
+
return findings
|
|
715
|
+
|
|
716
|
+
@staticmethod
|
|
717
|
+
def fix(text: str) -> str:
|
|
718
|
+
return text
|
|
719
|
+
|
|
720
|
+
|
|
721
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
722
|
+
# PATTERN 18 — FindSet before DeleteAll (unnecessary guard)
|
|
723
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
724
|
+
@_register(
|
|
725
|
+
id="FINDSET_BEFORE_DELETEALL",
|
|
726
|
+
group="Bulk Operations",
|
|
727
|
+
severity="MEDIUM",
|
|
728
|
+
title="FindSet() guard before DeleteAll() is redundant",
|
|
729
|
+
description=('Same anti-pattern as FindSet before ModifyAll — calling FindSet() before DeleteAll() fires an extra SELECT just to verify rows exist. DeleteAll() already handles empty result sets — it does nothing.\n\nSQL IMPACT: Extra query: SELECT TOP 50 ... (only to check existence).\nThen: DELETE FROM ... WHERE ... (DeleteAll — does this anyway).\nFindSet before DeleteAll = 2 SQL queries. Just DeleteAll = 1 SQL DELETE statement.\n\nBAD: if Record.FindSet() then Record.DeleteAll();\nGOOD: Record.DeleteAll();\n\nHINT: Same as FindSet before ModifyAll but for DeleteAll. With FindSet: 2 queries. Without: 1 DELETE statement.'),
|
|
730
|
+
exercises=[20],
|
|
731
|
+
)
|
|
732
|
+
class PatternFindSetBeforeDeleteAll:
|
|
733
|
+
_RE = re.compile(r'if\s+(\w+)\.FindSet\(\)\s+then\s*\n?\s*\1\.DeleteAll\(', re.MULTILINE)
|
|
734
|
+
|
|
735
|
+
@staticmethod
|
|
736
|
+
def detect(text: str) -> list[dict]:
|
|
737
|
+
return _findings(text, PatternFindSetBeforeDeleteAll._RE,
|
|
738
|
+
lambda m: f"FindSet() guard before DeleteAll() on '{m.group(1)}' is redundant")
|
|
739
|
+
|
|
740
|
+
@staticmethod
|
|
741
|
+
def fix(text: str) -> str:
|
|
742
|
+
return re.sub(
|
|
743
|
+
r'if\s+(\w+)\.FindSet\(\)\s+then\s*\n(\s+)\1\.DeleteAll\(',
|
|
744
|
+
r'\2\1.DeleteAll(',
|
|
745
|
+
text
|
|
746
|
+
)
|
|
747
|
+
|
|
748
|
+
|
|
749
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
750
|
+
# PATTERN 19 — DeleteAll without IsEmpty guard on lock-sensitive records
|
|
751
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
752
|
+
@_register(
|
|
753
|
+
id="DELETEALL_NO_ISEMPTY_GUARD",
|
|
754
|
+
group="Locking",
|
|
755
|
+
severity="LOW",
|
|
756
|
+
title="DeleteAll() without IsEmpty guard acquires write lock even when empty",
|
|
757
|
+
description=('DeleteAll() on an empty (or likely-empty) table still fires a DELETE FROM ... SQL statement — acquiring a write lock even if there are zero rows to delete. Under high concurrency, unnecessary lock acquisition causes contention.\n\nSQL IMPACT: DELETE FROM ... WHERE ... → acquires write lock even if 0 rows affected.\nIsEmpty guard: IF EXISTS check first → skip DELETE if empty.\n\nCONSIDER: if not Record.IsEmpty() then Record.DeleteAll(false);\n\nHINT: Call DeleteAll on an empty table in SQL Profiler. Without guard: DELETE fires even with 0 rows. With IsEmpty guard: DELETE skipped entirely.'),
|
|
758
|
+
exercises=[21],
|
|
759
|
+
)
|
|
760
|
+
class PatternDeleteAllNoGuard:
|
|
761
|
+
@staticmethod
|
|
762
|
+
def detect(text: str) -> list[dict]:
|
|
763
|
+
findings = []
|
|
764
|
+
lines = text.splitlines()
|
|
765
|
+
for i, line in enumerate(lines):
|
|
766
|
+
m = re.search(r'(\w+)\.DeleteAll\(', line)
|
|
767
|
+
if not m or line.strip().startswith('//'):
|
|
768
|
+
continue
|
|
769
|
+
var = m.group(1)
|
|
770
|
+
# Check 2 lines above for IsEmpty guard on same var
|
|
771
|
+
context = '\n'.join(lines[max(0, i-2):i])
|
|
772
|
+
if f'{var}.IsEmpty' not in context:
|
|
773
|
+
findings.append({
|
|
774
|
+
"line": i + 1,
|
|
775
|
+
"snippet": line.strip()[:120],
|
|
776
|
+
"message": f"Consider 'if not {var}.IsEmpty() then' guard before DeleteAll() to avoid locking on empty sets"
|
|
777
|
+
})
|
|
778
|
+
return findings
|
|
779
|
+
|
|
780
|
+
@staticmethod
|
|
781
|
+
def fix(text: str) -> str:
|
|
782
|
+
return text
|
|
783
|
+
|
|
784
|
+
|
|
785
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
786
|
+
# PATTERN 20 — Count() = 1 "exactly one" check (use FindFirst + Next)
|
|
787
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
788
|
+
@_register(
|
|
789
|
+
id="COUNT_EQUALS_ONE",
|
|
790
|
+
group="Existence Checks",
|
|
791
|
+
severity="MEDIUM",
|
|
792
|
+
title="Count() = 1 to check uniqueness scans entire set",
|
|
793
|
+
description=("Count() = 1 requires the database to count ALL matching rows. To check 'exactly one record exists', you only need to fetch two rows: FindFirst() gets the first, Next() = 0 confirms there is no second. Maximum 2 row reads.\n\nSQL IMPACT: Count() = 1: SELECT COUNT(*) FROM ... → full table scan.\nFindFirst + Next: SELECT TOP 1 then SELECT TOP 1 → max 2 rows read.\n\nBAD: exit(Record.Count() = 1);\nGOOD: if Record.FindFirst() then exit(Record.Next() = 0)\n else exit(false);\n\nHINT: Compare SQL for Count()=1 vs FindFirst+Next approach. Count() reads entire matching set. FindFirst+Next reads at most 2 rows."),
|
|
794
|
+
exercises=[22],
|
|
795
|
+
)
|
|
796
|
+
class PatternCountEqualsOne:
|
|
797
|
+
_RE = re.compile(r'(\w+)\.Count\(\)\s*=\s*1', re.MULTILINE)
|
|
798
|
+
|
|
799
|
+
@staticmethod
|
|
800
|
+
def detect(text: str) -> list[dict]:
|
|
801
|
+
return _findings(text, PatternCountEqualsOne._RE,
|
|
802
|
+
lambda m: f"Count() = 1 scans entire set — use FindFirst() + Next() = 0")
|
|
803
|
+
|
|
804
|
+
@staticmethod
|
|
805
|
+
def fix(text: str) -> str:
|
|
806
|
+
def replace(m):
|
|
807
|
+
var = m.group(1)
|
|
808
|
+
# Look at context to see if it's in an exit()
|
|
809
|
+
return f'{var}.FindFirst() and ({var}.Next() = 0)'
|
|
810
|
+
return PatternCountEqualsOne._RE.sub(replace, text)
|
|
811
|
+
|
|
812
|
+
|
|
813
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
814
|
+
# PATTERN 21 — Insert-on-conflict pattern (try Insert first, Modify on fail)
|
|
815
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
816
|
+
@_register(
|
|
817
|
+
id="INSERT_ON_CONFLICT",
|
|
818
|
+
group="Write Patterns",
|
|
819
|
+
severity="MEDIUM",
|
|
820
|
+
title="Insert-on-conflict anti-pattern (try Insert, Modify on fail)",
|
|
821
|
+
description=('The Insert always fires. On duplicate key, SQL raises a constraint error that is caught and triggers a Modify. Error handling in SQL is extremely expensive — each conflict = a rolled-back statement + error event.\n\nSQL IMPACT: On conflict: INSERT (fails) → SQL error → error handling → UPDATE.\nWith Get: SELECT (1 row) → branch → INSERT or UPDATE (no errors).\n\nBAD: if not Record.Insert(false) then Record.Modify(false);\nGOOD: if Record.Get(KeyValue) then Record.Modify(false)\n else begin Record.Init(); Record.Insert(false); end;\n\nHINT: On conflict: INSERT path fires a SQL error event — visible in Profiler. Get+branch: no error events.'),
|
|
822
|
+
exercises=[23],
|
|
823
|
+
)
|
|
824
|
+
class PatternInsertOnConflict:
|
|
825
|
+
_RE = re.compile(r'if not \w+\.Insert\((?:false|true)?\) then\s+\w+\.Modify\(', re.MULTILINE)
|
|
826
|
+
|
|
827
|
+
@staticmethod
|
|
828
|
+
def detect(text: str) -> list[dict]:
|
|
829
|
+
return _findings(text, PatternInsertOnConflict._RE,
|
|
830
|
+
lambda m: "Insert-on-fail pattern — use Get() then Modify/Insert for clarity and efficiency")
|
|
831
|
+
|
|
832
|
+
@staticmethod
|
|
833
|
+
def fix(text: str) -> str:
|
|
834
|
+
return text
|
|
835
|
+
|
|
836
|
+
|
|
837
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
838
|
+
# PATTERN 22 — SetCurrentKey missing for sorted iteration
|
|
839
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
840
|
+
@_register(
|
|
841
|
+
id="MISSING_SETCURRENTKEY",
|
|
842
|
+
group="Sort / Keys",
|
|
843
|
+
severity="MEDIUM",
|
|
844
|
+
title="Find('-') or FindSet without SetCurrentKey when order matters",
|
|
845
|
+
description=('Find(\'-\') always reads in PRIMARY KEY ascending order, regardless of any SetCurrentKey call made before it. To read data in a specific sort order, use FindSet() after SetCurrentKey and (for descending) SetAscending(false).\n\nSQL IMPACT: Find(\'-\'): always ORDER BY primary key ASC — SetCurrentKey ignored.\nFindSet with SetAscending: ORDER BY <key> DESC — correct ordering.\n\nBAD: Record.SetCurrentKey(\\"Posting Date\\"); if Record.Find(\'-\') then ...\nGOOD: Record.SetCurrentKey(\\"Posting Date\\");\n Record.SetAscending(\\"Posting Date\\", false);\n if Record.FindSet() then ...\n\nHINT: Check ORDER BY in SQL after Find(\'-\') with SetCurrentKey. SetCurrentKey is ignored — ORDER BY uses primary key.'),
|
|
846
|
+
exercises=[24],
|
|
847
|
+
)
|
|
848
|
+
class PatternMissingSetCurrentKey:
|
|
849
|
+
@staticmethod
|
|
850
|
+
def detect(text: str) -> list[dict]:
|
|
851
|
+
return [] # Covered by FIND_DASH_BUFFER_ONE; too context-specific to detect generically
|
|
852
|
+
|
|
853
|
+
@staticmethod
|
|
854
|
+
def fix(text: str) -> str:
|
|
855
|
+
return text
|
|
856
|
+
|
|
857
|
+
|
|
858
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
859
|
+
# PATTERN 23 — Temp table as collection (use List/Dictionary)
|
|
860
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
861
|
+
@_register(
|
|
862
|
+
id="TEMP_TABLE_AS_COLLECTION",
|
|
863
|
+
group="Memory / Copies",
|
|
864
|
+
severity="MEDIUM",
|
|
865
|
+
title="Temporary table used purely as a collection (use List or Dictionary)",
|
|
866
|
+
description=('Using a temporary table purely to collect distinct scalar values (dates, IDs, codes) carries full record-layer overhead: schema validation, key index maintenance, Init/Insert/FindSet calls. List of [T] is a native AL type with zero record overhead.\n\nSQL IMPACT: Temp table Insert/FindSet: record struct overhead per value.\nList of [Date]: direct array access, no schema, no key lookup.\n\nBAD: TempDates: Record \\"Workshop Data\\" temporary; TempDates.\\"Posting Date\\" := ...; TempDates.Insert();\nGOOD: Dates: List of [Date]; if not Dates.Contains(PostingDate) then Dates.Add(PostingDate);\n\nHINT: Compare temp table Insert/FindSet vs List.Add/iteration. Temp table: schema overhead even in memory. List: pure NST memory array.'),
|
|
867
|
+
exercises=[25],
|
|
868
|
+
)
|
|
869
|
+
class PatternTempTableAsCollection:
|
|
870
|
+
@staticmethod
|
|
871
|
+
def detect(text: str) -> list[dict]:
|
|
872
|
+
findings = []
|
|
873
|
+
lines = text.splitlines()
|
|
874
|
+
for i, line in enumerate(lines):
|
|
875
|
+
m = re.search(r'(Temp\w+)\s*:\s*Record\s+\S+\s+temporary', line)
|
|
876
|
+
if not m:
|
|
877
|
+
continue
|
|
878
|
+
var = m.group(1)
|
|
879
|
+
rest = '\n'.join(lines[i:min(len(lines), i+80)])
|
|
880
|
+
# Pure collection: Insert without reading back meaningful fields
|
|
881
|
+
has_insert = bool(re.search(rf'\b{re.escape(var)}\.Insert\(', rest))
|
|
882
|
+
has_get = bool(re.search(rf'\b{re.escape(var)}\.Get\(', rest))
|
|
883
|
+
has_setrange = bool(re.search(rf'\b{re.escape(var)}\.SetRange\(', rest))
|
|
884
|
+
if has_insert and has_setrange and not has_get:
|
|
885
|
+
findings.append({
|
|
886
|
+
"line": i + 1,
|
|
887
|
+
"snippet": line.strip()[:120],
|
|
888
|
+
"message": f"'{var}' used as collection (Insert+SetRange, no Get) — use List of [...] instead"
|
|
889
|
+
})
|
|
890
|
+
return findings
|
|
891
|
+
|
|
892
|
+
@staticmethod
|
|
893
|
+
def fix(text: str) -> str:
|
|
894
|
+
return text
|
|
895
|
+
|
|
896
|
+
|
|
897
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
898
|
+
# PATTERN 24 — FindLast / FindFirst inside a loop
|
|
899
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
900
|
+
@_register(
|
|
901
|
+
id="FINDLAST_IN_LOOP",
|
|
902
|
+
group="Data Transfer",
|
|
903
|
+
severity="HIGH",
|
|
904
|
+
title="FindLast()/FindFirst() inside a loop (call once before the loop)",
|
|
905
|
+
description=('Calling FindLast() inside a loop to determine the next Entry No. fires SELECT MAX(\\"Entry No_\\") ... or ORDER BY DESC FETCH 1 on EVERY iteration. For 5 000 lines that is 5 000 SQL round-trips for a counter. One FindLast() before the loop + a local counter is O(1).\n\nSQL IMPACT: Per iteration: SELECT TOP 1 ... ORDER BY \\"Entry No_\\" DESC = N SQL queries.\n\nBAD: foreach Line in ImportSource do begin Record.FindLast(); NextNo := Record.\\"Entry No.\\" + 1; ...\nGOOD: Record.FindLast(); NextNo := Record.\\"Entry No.\\" + 1;\n foreach Line in ImportSource do begin NextNo += 1; ... end;\n\nHINT: Trace FindLast() calls in the loop with SQL Profiler. Each iteration fires ORDER BY DESC FETCH 1. Single FindLast before loop: 1 SQL query total.'),
|
|
906
|
+
exercises=[26],
|
|
907
|
+
)
|
|
908
|
+
class PatternFindLastInLoop:
|
|
909
|
+
@staticmethod
|
|
910
|
+
def detect(text: str) -> list[dict]:
|
|
911
|
+
findings = []
|
|
912
|
+
lines = text.splitlines()
|
|
913
|
+
in_loop = False
|
|
914
|
+
for i, line in enumerate(lines):
|
|
915
|
+
stripped = line.strip()
|
|
916
|
+
if re.search(r'\bforeach\b|\brepeat\b', stripped, re.IGNORECASE):
|
|
917
|
+
in_loop = True
|
|
918
|
+
if re.match(r'until\s+\w+\.Next\(\)', stripped, re.IGNORECASE) or (stripped == 'end;' and in_loop):
|
|
919
|
+
in_loop = False
|
|
920
|
+
if in_loop and re.search(r'\w+\.(FindLast|FindFirst)\(\)', line) and not stripped.startswith('//'):
|
|
921
|
+
findings.append({
|
|
922
|
+
"line": i + 1,
|
|
923
|
+
"snippet": line.strip()[:120],
|
|
924
|
+
"message": "FindLast/FindFirst inside loop — call once before the loop and cache the result"
|
|
925
|
+
})
|
|
926
|
+
return findings
|
|
927
|
+
|
|
928
|
+
@staticmethod
|
|
929
|
+
def fix(text: str) -> str:
|
|
930
|
+
return text
|
|
931
|
+
|
|
932
|
+
|
|
933
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
934
|
+
# PATTERN 25 — LockTable + FindLast for sequence generation (use NumberSequence)
|
|
935
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
936
|
+
@_register(
|
|
937
|
+
id="LOCKTABLE_FOR_SEQUENCE",
|
|
938
|
+
group="Locking",
|
|
939
|
+
severity="HIGH",
|
|
940
|
+
title="LockTable + FindLast for sequence numbers — use NumberSequence",
|
|
941
|
+
description=("LockTable() acquires a full table-level exclusive write lock held for the entire transaction. Any concurrent session needing this table blocks. Under high-volume processing (hundreds of operations per minute) this creates lock wait queues and eventual timeout errors.\n\nSQL IMPACT: LockTable: X-lock on entire table for transaction duration.\nNumberSequence.Next(): atomic counter at DB level — no table lock.\n\nBAD: Record.LockTable(true); if Record.FindLast() then NextNo := Record.PK + 1;\nGOOD: if not NumberSequence.Exists('MY_SEQ') then NumberSequence.Insert('MY_SEQ',1,1,false);\n NextNo := NumberSequence.Next('MY_SEQ');\n\nHINT: LockTable: watch lock events in SQL Profiler. NumberSequence: no table lock — atomic sequence increment. Compare concurrency: run two sessions simultaneously."),
|
|
942
|
+
exercises=[28],
|
|
943
|
+
)
|
|
944
|
+
class PatternLockTableForSequence:
|
|
945
|
+
@staticmethod
|
|
946
|
+
def detect(text: str) -> list[dict]:
|
|
947
|
+
findings = []
|
|
948
|
+
lines = text.splitlines()
|
|
949
|
+
for i, line in enumerate(lines):
|
|
950
|
+
if re.search(r'\w+\.LockTable\(', line) and not line.strip().startswith('//'):
|
|
951
|
+
# Look ahead for FindLast to get next key
|
|
952
|
+
ahead = '\n'.join(lines[i:min(len(lines), i+8)])
|
|
953
|
+
if re.search(r'FindLast\(\)', ahead) and re.search(r'Entry No|NextSeq|NextNo|NextKey', ahead, re.IGNORECASE):
|
|
954
|
+
findings.append({
|
|
955
|
+
"line": i + 1,
|
|
956
|
+
"snippet": line.strip()[:120],
|
|
957
|
+
"message": "LockTable + FindLast for sequence generation — use NumberSequence.Next() instead"
|
|
958
|
+
})
|
|
959
|
+
return findings
|
|
960
|
+
|
|
961
|
+
@staticmethod
|
|
962
|
+
def fix(text: str) -> str:
|
|
963
|
+
return text
|
|
964
|
+
|
|
965
|
+
|
|
966
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
967
|
+
# PATTERN 26 — SetRange on PK + FindFirst instead of Get
|
|
968
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
969
|
+
@_register(
|
|
970
|
+
id="SETRANGE_FINDSET_FOR_GET",
|
|
971
|
+
group="Data Transfer",
|
|
972
|
+
severity="MEDIUM",
|
|
973
|
+
title="SetRange on PK + FindFirst instead of direct Get()",
|
|
974
|
+
description=('SetRange on a primary key field followed by FindFirst() goes through the filter+scan path instead of the optimized single-row lookup. Get() uses the primary key index directly — no cursor setup, hits the clustered index directly.\n\nSQL IMPACT: SetRange+FindFirst: SELECT TOP 50 ... WHERE \\"No_\\"=X (cursor setup overhead).\nGet(): Direct clustered index point lookup — no cursor. Measurably faster in high-frequency loops.\n\nBAD: Customer.SetRange(\\"No.\\", CustomerNo); if Customer.FindFirst() then ...\nGOOD: if Customer.Get(CustomerNo) then ...\n\nHINT: Compare SELECT TOP 50 (SetRange+FindFirst) vs direct lookup. Get() hits clustered index directly — 1 read, no cursor.'),
|
|
975
|
+
exercises=[29],
|
|
976
|
+
)
|
|
977
|
+
class PatternSetRangeFindFirstForGet:
|
|
978
|
+
@staticmethod
|
|
979
|
+
def detect(text: str) -> list[dict]:
|
|
980
|
+
findings = []
|
|
981
|
+
lines = text.splitlines()
|
|
982
|
+
for i, line in enumerate(lines):
|
|
983
|
+
m = re.search(r'(\w+)\.SetRange\("No\.",\s*\w+\)', line)
|
|
984
|
+
if not m or line.strip().startswith('//'):
|
|
985
|
+
continue
|
|
986
|
+
var = m.group(1)
|
|
987
|
+
ahead = '\n'.join(lines[i:min(len(lines), i+3)])
|
|
988
|
+
if re.search(rf'\b{re.escape(var)}\.FindFirst\(\)', ahead):
|
|
989
|
+
findings.append({
|
|
990
|
+
"line": i + 1,
|
|
991
|
+
"snippet": line.strip()[:120],
|
|
992
|
+
"message": f"'{var}.SetRange(\"No.\", ...) + FindFirst()' — use '{var}.Get(...)' directly"
|
|
993
|
+
})
|
|
994
|
+
return findings
|
|
995
|
+
|
|
996
|
+
@staticmethod
|
|
997
|
+
def fix(text: str) -> str:
|
|
998
|
+
return text
|
|
999
|
+
|
|
1000
|
+
|
|
1001
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1002
|
+
# PATTERN 27 — Silent Insert failure (if Insert then)
|
|
1003
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1004
|
+
@_register(
|
|
1005
|
+
id="SILENT_INSERT_FAILURE",
|
|
1006
|
+
group="Write Patterns",
|
|
1007
|
+
severity="MEDIUM",
|
|
1008
|
+
title="'if Record.Insert(false) then' silently swallows duplicate-key errors",
|
|
1009
|
+
description=("In AL, Insert(false) does NOT suppress the SQL unique constraint error — it still propagates. Wrapping it in 'if ... then' gives a false sense that the failure is handled. In practice the record silently isn't created and the caller never knows, leading to data integrity gaps.\n\nSQL IMPACT: SQL unique constraint error still raised — 'if then' doesn't catch SQL errors.\nSilent failure → missing records → integrity gap.\n\nBAD: if Record.Insert(false) then MovementCount += 1;\nGOOD: Record.Insert(false); MovementCount += 1;\n\nHINT: Insert a duplicate key row with 'if Insert then'. Check SQL Profiler — does the error appear? The record is not created but no AL error raised."),
|
|
1010
|
+
exercises=[30],
|
|
1011
|
+
)
|
|
1012
|
+
class PatternSilentInsertFailure:
|
|
1013
|
+
_RE = re.compile(r'if\s+\w+\.Insert\((?:false|true)\)\s+then', re.MULTILINE)
|
|
1014
|
+
|
|
1015
|
+
@staticmethod
|
|
1016
|
+
def detect(text: str) -> list[dict]:
|
|
1017
|
+
return _findings(text, PatternSilentInsertFailure._RE,
|
|
1018
|
+
lambda m: "Silent Insert — errors won't surface. Use plain Insert() or handle explicitly")
|
|
1019
|
+
|
|
1020
|
+
@staticmethod
|
|
1021
|
+
def fix(text: str) -> str:
|
|
1022
|
+
return text
|
|
1023
|
+
|
|
1024
|
+
|
|
1025
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1026
|
+
# PATTERN 28 — LockTable too early (before read-only phase)
|
|
1027
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1028
|
+
@_register(
|
|
1029
|
+
id="LOCKTABLE_TOO_EARLY",
|
|
1030
|
+
group="Locking",
|
|
1031
|
+
severity="HIGH",
|
|
1032
|
+
title="LockTable() called before read phase — holds write lock during reads",
|
|
1033
|
+
description=('LockTable() at the top of a procedure holds an exclusive lock through the entire validation / read phase — which may take seconds on large data. Every other session needing this table is blocked for the full duration. The lock is only needed at the moment of the first write.\n\nSQL IMPACT: X-lock held from top of proc through entire read phase (seconds).\nvs. X-lock acquired just before first Modify (milliseconds).\n\nBAD: WorkshopData.LockTable(); ... if WorkshopData.FindSet() then [read loop] ...\nGOOD: [read loop without lock] ... WorkshopData.LockTable(); [write phase only]\n\nHINT: Use Activity Monitor or Profiler lock events. LockTable at start: X-lock held during entire read phase. LockTable at write phase: X-lock held for milliseconds only.'),
|
|
1034
|
+
exercises=[31, 42],
|
|
1035
|
+
)
|
|
1036
|
+
class PatternLockTableTooEarly:
|
|
1037
|
+
@staticmethod
|
|
1038
|
+
def detect(text: str) -> list[dict]:
|
|
1039
|
+
findings = []
|
|
1040
|
+
lines = text.splitlines()
|
|
1041
|
+
for i, line in enumerate(lines):
|
|
1042
|
+
if re.search(r'\w+\.LockTable\(', line) and not line.strip().startswith('//'):
|
|
1043
|
+
# Check if FindSet follows (read phase)
|
|
1044
|
+
ahead = '\n'.join(lines[i:min(len(lines), i+15)])
|
|
1045
|
+
if re.search(r'\.FindSet\(\)', ahead):
|
|
1046
|
+
findings.append({
|
|
1047
|
+
"line": i + 1,
|
|
1048
|
+
"snippet": line.strip()[:120],
|
|
1049
|
+
"message": "LockTable() before FindSet — move lock closer to the write operation"
|
|
1050
|
+
})
|
|
1051
|
+
return findings
|
|
1052
|
+
|
|
1053
|
+
@staticmethod
|
|
1054
|
+
def fix(text: str) -> str:
|
|
1055
|
+
return text
|
|
1056
|
+
|
|
1057
|
+
|
|
1058
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1059
|
+
# PATTERN 29 — Missing ReadIsolation (dirty reads safe = ReadUncommitted)
|
|
1060
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1061
|
+
@_register(
|
|
1062
|
+
id="MISSING_READ_ISOLATION",
|
|
1063
|
+
group="Locking",
|
|
1064
|
+
severity="MEDIUM",
|
|
1065
|
+
title="FindSet on reporting/read-only query without ReadIsolation = ReadUncommitted",
|
|
1066
|
+
description=('Read-only analytics FindSet acquires Shared (S) locks on every fetched page. Concurrent warehouse write sessions hold Exclusive (X) locks on same rows. Result: analytics blocks postings, postings block analytics. On a 50 000-row scan, S-locks are held for several seconds.\n\nSQL IMPACT: Default isolation: Shared (S) locks per page fetched.\nReadUncommitted: NO lock acquisition — readers never block writers.\n\nGOOD: WorkshopData.ReadIsolation := IsolationLevel::ReadUncommitted;\n if WorkshopData.FindSet() then ...\n\nHINT: Without ReadUncommitted: watch S-lock events per page in SQL Profiler. With ReadUncommitted: zero S-lock events — readers invisible. Never use for financial postings or validation.'),
|
|
1067
|
+
exercises=[34],
|
|
1068
|
+
)
|
|
1069
|
+
class PatternMissingReadIsolation:
|
|
1070
|
+
@staticmethod
|
|
1071
|
+
def detect(text: str) -> list[dict]:
|
|
1072
|
+
findings = []
|
|
1073
|
+
lines = text.splitlines()
|
|
1074
|
+
for i, line in enumerate(lines):
|
|
1075
|
+
if re.search(r'\w+\.FindSet\(\)', line) and not line.strip().startswith('//'):
|
|
1076
|
+
# Procedure name suggests reporting
|
|
1077
|
+
context_above = '\n'.join(lines[max(0, i-30):i])
|
|
1078
|
+
if re.search(r'Report|Dashboard|Export|Build.*Report|Snapshot', context_above, re.IGNORECASE):
|
|
1079
|
+
if 'ReadIsolation' not in context_above:
|
|
1080
|
+
findings.append({
|
|
1081
|
+
"line": i + 1,
|
|
1082
|
+
"snippet": line.strip()[:120],
|
|
1083
|
+
"message": "Reporting FindSet without ReadIsolation := ReadUncommitted — may block concurrent writes"
|
|
1084
|
+
})
|
|
1085
|
+
return findings
|
|
1086
|
+
|
|
1087
|
+
@staticmethod
|
|
1088
|
+
def fix(text: str) -> str:
|
|
1089
|
+
return text
|
|
1090
|
+
|
|
1091
|
+
|
|
1092
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1093
|
+
# PATTERN 30 — RecordRef/FieldRef when typed Record is sufficient
|
|
1094
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1095
|
+
@_register(
|
|
1096
|
+
id="RECORDREF_WHEN_TYPED_SUFFICIENT",
|
|
1097
|
+
group="Memory / Copies",
|
|
1098
|
+
severity="LOW",
|
|
1099
|
+
title="RecordRef/FieldRef used when a typed Record variable would suffice",
|
|
1100
|
+
description=('RecordRef provides late-bound, reflection-based table access. Each Field() call does a dictionary lookup + type boxing. SQL generation is less optimized than for typed Record variables. Benchmarks show 3–5x slower reads than typed Record on same data.\n\nSQL IMPACT: RecordRef: Field() lookup + boxing overhead per field per row.\nTyped Record: direct field access, compiler-optimized SQL.\n\nBAD: RecRef: RecordRef; RecRef.Open(Database::\\"Workshop Data\\"); RecRef.Field(2).Value := ...;\nGOOD: WorkshopData: Record \\"Workshop Data\\"; WorkshopData.Description := ...;\n\nHINT: Compare RecordRef.Field(2).Value vs typed WorkshopData.Description. Run a 10 000-row loop with each — time the difference. RecordRef is 3–5x slower.'),
|
|
1101
|
+
exercises=[35],
|
|
1102
|
+
)
|
|
1103
|
+
class PatternRecordRefUnnecessary:
|
|
1104
|
+
_RE = re.compile(r'\bRecRef\s*:\s*RecordRef\b|\bFldRef\s*:\s*FieldRef\b', re.MULTILINE)
|
|
1105
|
+
|
|
1106
|
+
@staticmethod
|
|
1107
|
+
def detect(text: str) -> list[dict]:
|
|
1108
|
+
return _findings(text, PatternRecordRefUnnecessary._RE,
|
|
1109
|
+
lambda m: "RecordRef/FieldRef — consider typed Record variable if table is known at compile time")
|
|
1110
|
+
|
|
1111
|
+
@staticmethod
|
|
1112
|
+
def fix(text: str) -> str:
|
|
1113
|
+
return text
|
|
1114
|
+
|
|
1115
|
+
|
|
1116
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1117
|
+
# PATTERN 31 — ModifyAll with RunTrigger=true
|
|
1118
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1119
|
+
@_register(
|
|
1120
|
+
id="MODIFYALL_RUNTRIGGER_TRUE",
|
|
1121
|
+
group="Bulk Operations",
|
|
1122
|
+
severity="HIGH",
|
|
1123
|
+
title="ModifyAll with RunTrigger=true fires OnModify trigger per row",
|
|
1124
|
+
description=('ModifyAll() with RunTrigger=true checks for OnAfterModify subscribers. If ANY subscriber is bound, ModifyAll falls back to N individual Modify() calls — one per record — each triggering the subscriber. 10 000 records × 1 Modify() call = 10 000 SQL UPDATE round-trips.\n\nSQL IMPACT: With RunTrigger=true + active subscriber: N × UPDATE per row.\nWith RunTrigger=false: 1 × UPDATE ... WHERE ... (single SQL statement).\n\nBAD: Record.ModifyAll(Field, Value, true);\nGOOD: Record.ModifyAll(Field, Value, false);\n\nHINT: Bind the subscriber and run ModifyAll with RunTrigger=true. SQL Profiler: count UPDATE statements — should be N rows. Change to RunTrigger=false: now count is 1 UPDATE statement.'),
|
|
1125
|
+
exercises=[37],
|
|
1126
|
+
)
|
|
1127
|
+
class PatternModifyAllRunTrigger:
|
|
1128
|
+
_RE = re.compile(r'\w+\.ModifyAll\([^)]+,\s*true\)', re.MULTILINE)
|
|
1129
|
+
|
|
1130
|
+
@staticmethod
|
|
1131
|
+
def detect(text: str) -> list[dict]:
|
|
1132
|
+
return _findings(text, PatternModifyAllRunTrigger._RE,
|
|
1133
|
+
lambda m: "ModifyAll with RunTrigger=true fires OnModify per row — use false unless required")
|
|
1134
|
+
|
|
1135
|
+
@staticmethod
|
|
1136
|
+
def fix(text: str) -> str:
|
|
1137
|
+
return re.sub(
|
|
1138
|
+
r'(\w+\.ModifyAll\([^)]+,\s*)true(\))',
|
|
1139
|
+
r'\1false\2',
|
|
1140
|
+
text
|
|
1141
|
+
)
|
|
1142
|
+
|
|
1143
|
+
|
|
1144
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1145
|
+
# PATTERN 32 — Missing Database.SelectLatestVersion in multi-pass loop
|
|
1146
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1147
|
+
@_register(
|
|
1148
|
+
id="MISSING_SELECTLATESTVERSION",
|
|
1149
|
+
group="Stale Reads",
|
|
1150
|
+
severity="MEDIUM",
|
|
1151
|
+
title="Multi-pass read loop without Database.SelectLatestVersion()",
|
|
1152
|
+
description=('BC NST caches SQL query results in-session. Repeated FindSet calls with the same filter return CACHED rows — no SQL executed after pass 1. A multi-pass pipeline reading the same filter silently returns stale data from pass 1 for passes 2–N if data changed concurrently.\n\nSQL IMPACT: Pass 1: SELECT ... (real SQL).\nPass 2–N: [NST cache hit] → no SQL, no awareness of concurrent updates.\n\nGOOD: foreach Pass in Passes do begin\n Database.SelectLatestVersion(); // Flushes non-locked session cache\n if Record.FindSet() then ...\n\nHINT: Run the pipeline twice: with and without SelectLatestVersion. Without flush: 0 SQL queries for passes 2–N (cache hit — stale data).'),
|
|
1153
|
+
exercises=[38],
|
|
1154
|
+
)
|
|
1155
|
+
class PatternMissingSelectLatestVersion:
|
|
1156
|
+
@staticmethod
|
|
1157
|
+
def detect(text: str) -> list[dict]:
|
|
1158
|
+
return [] # Too context-specific; covered by FIX comment detection
|
|
1159
|
+
|
|
1160
|
+
@staticmethod
|
|
1161
|
+
def fix(text: str) -> str:
|
|
1162
|
+
return text
|
|
1163
|
+
|
|
1164
|
+
|
|
1165
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1166
|
+
# PATTERN 33 — OR chain instead of case true of (3+ conditions)
|
|
1167
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1168
|
+
@_register(
|
|
1169
|
+
id="OR_CHAIN_USE_CASE_TRUE",
|
|
1170
|
+
group="Short-Circuit Evaluation",
|
|
1171
|
+
severity="MEDIUM",
|
|
1172
|
+
title="3+ OR conditions — use 'case true of' for short-circuit evaluation",
|
|
1173
|
+
description=('AL evaluates ALL operands of or before returning — even if the first operand is already true. Three expensive eligibility checks joined with or each execute a CalcSums or FindSet query — all three, every time.\n\nSQL IMPACT: 3 SQL queries per customer: CalcSums + IsEmpty + Count.\nEven when the first check already returns true — wasted 2 queries.\ncase true of with comma-separated conditions short-circuits at first true.\n\nBAD: if IsOverCreditLimit(No) or HasBlockedItems(No) or HasOverdueInvoices(No) then ...\nGOOD: case true of\n IsOverCreditLimit(No), HasBlockedItems(No), HasOverdueInvoices(No):\n exit(false);\n end;\n\nHINT: Add a counter inside each validation function. With or: all three counters increment for every customer. With case true of: only 1–2 counters increment when first is true.'),
|
|
1174
|
+
exercises=[39],
|
|
1175
|
+
)
|
|
1176
|
+
class PatternOrChainCaseTrue:
|
|
1177
|
+
_RE = re.compile(r'\bif\b[^;]+\bor\b[^;]+\bor\b[^;]+\bthen\b', re.MULTILINE | re.IGNORECASE)
|
|
1178
|
+
|
|
1179
|
+
@staticmethod
|
|
1180
|
+
def detect(text: str) -> list[dict]:
|
|
1181
|
+
findings = []
|
|
1182
|
+
for m in PatternOrChainCaseTrue._RE.finditer(text):
|
|
1183
|
+
line = _find_line(text, m.start())
|
|
1184
|
+
line_text = text.splitlines()[line-1].strip()
|
|
1185
|
+
if line_text.startswith('//'):
|
|
1186
|
+
continue
|
|
1187
|
+
# Count function calls in the OR chain
|
|
1188
|
+
if len(re.findall(r'\w+\(', m.group(0))) >= 3:
|
|
1189
|
+
findings.append({
|
|
1190
|
+
"line": line,
|
|
1191
|
+
"snippet": m.group(0)[:120],
|
|
1192
|
+
"message": "3+ OR conditions with function calls — use 'case true of' for short-circuit"
|
|
1193
|
+
})
|
|
1194
|
+
return findings
|
|
1195
|
+
|
|
1196
|
+
@staticmethod
|
|
1197
|
+
def fix(text: str) -> str:
|
|
1198
|
+
return text
|
|
1199
|
+
|
|
1200
|
+
|
|
1201
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1202
|
+
# PATTERN 34 — LockTable + ReadIsolation UpdLock (Ex42)
|
|
1203
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1204
|
+
@_register(
|
|
1205
|
+
id="LOCKTABLE_USE_UPDLOCK",
|
|
1206
|
+
group="Locking",
|
|
1207
|
+
severity="MEDIUM",
|
|
1208
|
+
title="LockTable() — consider ReadIsolation := UpdLock + FindSet(true) instead",
|
|
1209
|
+
description=('LockTable() acquires a table-level Exclusive (X) lock on the ENTIRE table. Every concurrent session — reads, analytics, order entry — blocks for the full transaction duration. A batch updating 1 000 rows can block all other sessions for seconds.\n\nSQL IMPACT: LockTable: X-lock on entire table — held for full transaction.\nReadIsolation := UpdLock + FindSet(true): acquires update locks only on rows actually read, allowing concurrent readers.\n\nBAD: Record.LockTable();\n if Record.FindSet() then\nGOOD: Record.ReadIsolation := IsolationLevel::UpdLock;\n if Record.FindSet(true) then\n\nHINT: Open two BC sessions simultaneously. Session 1: run LockTable. Session 2: try any read — it blocks until Session 1 commits. With UpdLock: Session 2 reads freely.'),
|
|
1210
|
+
exercises=[42],
|
|
1211
|
+
)
|
|
1212
|
+
class PatternLockTableUseUpdLock:
|
|
1213
|
+
_RE = re.compile(r'(\w+)\.LockTable\(\)', re.MULTILINE)
|
|
1214
|
+
|
|
1215
|
+
@staticmethod
|
|
1216
|
+
def detect(text: str) -> list[dict]:
|
|
1217
|
+
return _findings(text, PatternLockTableUseUpdLock._RE,
|
|
1218
|
+
lambda m: f"Consider replacing '{m.group(1)}.LockTable()' with ReadIsolation := UpdLock + FindSet(true)")
|
|
1219
|
+
|
|
1220
|
+
@staticmethod
|
|
1221
|
+
def fix(text: str) -> str:
|
|
1222
|
+
def replace(m):
|
|
1223
|
+
var = m.group(1)
|
|
1224
|
+
pos = m.end()
|
|
1225
|
+
ahead = text[pos:pos+200]
|
|
1226
|
+
if re.search(rf'\b{re.escape(var)}\.FindSet\(\)', ahead):
|
|
1227
|
+
replacement = f'{var}.ReadIsolation := IsolationLevel::UpdLock'
|
|
1228
|
+
# Also fix the FindSet in one pass
|
|
1229
|
+
return replacement
|
|
1230
|
+
return m.group(0)
|
|
1231
|
+
result = PatternLockTableUseUpdLock._RE.sub(replace, text)
|
|
1232
|
+
result = re.sub(r'(\w+)\.ReadIsolation := IsolationLevel::UpdLock;\s*\n(\s+)if \1\.FindSet\(\)',
|
|
1233
|
+
r'\1.ReadIsolation := IsolationLevel::UpdLock;\n\2if \1.FindSet(true)', result)
|
|
1234
|
+
return result
|
|
1235
|
+
|
|
1236
|
+
|
|
1237
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1238
|
+
# PATTERN 35 — true in [...] condition order (cheapest first)
|
|
1239
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1240
|
+
@_register(
|
|
1241
|
+
id="CONDITION_ORDER_TRUE_IN",
|
|
1242
|
+
group="Short-Circuit Evaluation",
|
|
1243
|
+
severity="LOW",
|
|
1244
|
+
title="'if true in [...]' — put cheapest condition first for best short-circuit",
|
|
1245
|
+
description=("AL's in [...] operator DOES short-circuit — unlike or/\x07nd. But placing the most expensive check FIRST defeats the benefit: the CalcSums fires before the cheap blacklist Get() is even tested. Rule: always order conditions cheapest-first in in [...] lists.\n\nSQL IMPACT: Expensive-first: CalcSums runs for ~100% of customers.\nCheap-first: CalcSums skipped for the ~35% caught by cheaper checks first.\n\nBAD: if true in [HasExceededAnnualBudget(No), IsBlacklisted(No)] then ...\nGOOD: if true in [IsBlacklisted(No), HasExceededAnnualBudget(No)] then ...\n\nHINT: Add a Message() counter inside HasExceededAnnualBudget. Run with expensive-first: counter = total customer count. Reorder to cheap-first: counter drops by ~35%."),
|
|
1246
|
+
exercises=[44],
|
|
1247
|
+
)
|
|
1248
|
+
class PatternConditionOrderTrueIn:
|
|
1249
|
+
_RE = re.compile(r'if true in \[', re.MULTILINE | re.IGNORECASE)
|
|
1250
|
+
|
|
1251
|
+
@staticmethod
|
|
1252
|
+
def detect(text: str) -> list[dict]:
|
|
1253
|
+
return _findings(text, PatternConditionOrderTrueIn._RE,
|
|
1254
|
+
lambda m: "Review condition order: put cheapest check first for best short-circuit performance")
|
|
1255
|
+
|
|
1256
|
+
@staticmethod
|
|
1257
|
+
def fix(text: str) -> str:
|
|
1258
|
+
return text
|
|
1259
|
+
|
|
1260
|
+
|
|
1261
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1262
|
+
# PATTERN 36 — N+1 nested FindSet inside repeat..until loop (Ex 27 / 43)
|
|
1263
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1264
|
+
@_register(
|
|
1265
|
+
id="NESTED_FINDSET_N_PLUS_ONE",
|
|
1266
|
+
group="Data Transfer",
|
|
1267
|
+
severity="HIGH",
|
|
1268
|
+
title="Nested FindSet/FindFirst inside repeat..until loop (N+1 queries)",
|
|
1269
|
+
description=(
|
|
1270
|
+
"For each row in the outer FindSet, an inner FindSet on a different variable fires a new SQL query. "
|
|
1271
|
+
"With 1 000 outer items: 1 outer SELECT + 1 000 inner SELECTs = 1 001 SQL round-trips. "
|
|
1272
|
+
"A Query object with GROUP BY does the same work in a single SQL query.\n\n"
|
|
1273
|
+
"SQL IMPACT: 1 000 items × 1 inner query = 1 001 total SQL round-trips.\n"
|
|
1274
|
+
"Query object: 1 SQL query with GROUP BY — result set = N groups only.\n\n"
|
|
1275
|
+
"BAD: if Items.FindSet() then repeat\n"
|
|
1276
|
+
" SalesLines.SetRange(\"No.\", Items.\"No.\");\n"
|
|
1277
|
+
" if SalesLines.FindSet() then repeat ... until SalesLines.Next() = 0;\n"
|
|
1278
|
+
" until Items.Next() = 0;\n"
|
|
1279
|
+
"GOOD: var AnalysisQuery: Query \"Workshop Item Analysis\";\n"
|
|
1280
|
+
" if AnalysisQuery.Open() then\n"
|
|
1281
|
+
" while AnalysisQuery.Read() do ...\n\n"
|
|
1282
|
+
"HINT: Count SQL queries in Profiler for the nested loop. Each outer row fires 1 inner SQL query. "
|
|
1283
|
+
"Query object version: 1 SQL query with GROUP BY regardless of data volume."
|
|
1284
|
+
),
|
|
1285
|
+
exercises=[27, 43],
|
|
1286
|
+
)
|
|
1287
|
+
class PatternNestedFindSetNPlusOne:
|
|
1288
|
+
@staticmethod
|
|
1289
|
+
def detect(text: str) -> list[dict]:
|
|
1290
|
+
findings = []
|
|
1291
|
+
lines = text.splitlines()
|
|
1292
|
+
outer_var: str | None = None
|
|
1293
|
+
in_loop = False
|
|
1294
|
+
|
|
1295
|
+
for i, line in enumerate(lines):
|
|
1296
|
+
stripped = line.strip()
|
|
1297
|
+
if stripped.startswith('//'):
|
|
1298
|
+
continue
|
|
1299
|
+
|
|
1300
|
+
# Track outer FindSet before a repeat
|
|
1301
|
+
m_outer = re.search(r'(\w+)\.(FindSet|FindFirst)\(', line)
|
|
1302
|
+
if m_outer and not in_loop:
|
|
1303
|
+
outer_var = m_outer.group(1)
|
|
1304
|
+
|
|
1305
|
+
if re.match(r'^repeat\b', stripped, re.IGNORECASE) and outer_var:
|
|
1306
|
+
in_loop = True
|
|
1307
|
+
|
|
1308
|
+
if in_loop:
|
|
1309
|
+
m_inner = re.search(r'(\w+)\.(FindSet|FindFirst)\(', line)
|
|
1310
|
+
if m_inner and m_inner.group(1) != outer_var:
|
|
1311
|
+
findings.append({
|
|
1312
|
+
"line": i + 1,
|
|
1313
|
+
"snippet": line.strip()[:120],
|
|
1314
|
+
"message": (
|
|
1315
|
+
f"Nested {m_inner.group(2)}() on '{m_inner.group(1)}' inside outer "
|
|
1316
|
+
f"'{outer_var}' FindSet loop — N+1 SQL queries. "
|
|
1317
|
+
"Consider a Query object with GROUP BY."
|
|
1318
|
+
),
|
|
1319
|
+
})
|
|
1320
|
+
|
|
1321
|
+
if re.match(r'^until\s+\w+\.Next\(\)', stripped, re.IGNORECASE):
|
|
1322
|
+
in_loop = False
|
|
1323
|
+
outer_var = None
|
|
1324
|
+
|
|
1325
|
+
return findings
|
|
1326
|
+
|
|
1327
|
+
@staticmethod
|
|
1328
|
+
def fix(text: str) -> str:
|
|
1329
|
+
return text # Structural change required — no auto-fix
|
|
1330
|
+
|
|
1331
|
+
|
|
1332
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1333
|
+
# PATTERN 37 — AutoIncrement = true disables SQL batch INSERT (Ex 36)
|
|
1334
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1335
|
+
@_register(
|
|
1336
|
+
id="AUTOINCREMENT_DISABLES_BULK_INSERT",
|
|
1337
|
+
group="Bulk Operations",
|
|
1338
|
+
severity="HIGH",
|
|
1339
|
+
title="AutoIncrement = true on PK disables SQL batch INSERT",
|
|
1340
|
+
description=(
|
|
1341
|
+
"SQL Server IDENTITY (AutoIncrement = true) requires SCOPE_IDENTITY() to be returned "
|
|
1342
|
+
"after each INSERT — this prevents batch INSERT entirely. "
|
|
1343
|
+
"For 10 000 count sheet lines: 10 000 individual SQL INSERTs, one per row. "
|
|
1344
|
+
"Manual PK assignment via NumberSequence allows SQL Server to batch rows into one trip.\n\n"
|
|
1345
|
+
"SQL IMPACT: AutoIncrement: 10 000 × INSERT (+ SCOPE_IDENTITY per row).\n"
|
|
1346
|
+
"Manual PK with NumberSequence: ~10 batch INSERT statements — orders of magnitude faster.\n\n"
|
|
1347
|
+
"BAD: field(1; Id; Integer) { AutoIncrement = true; }\n"
|
|
1348
|
+
"GOOD: field(1; Id; Integer) { }\n"
|
|
1349
|
+
" // In code:\n"
|
|
1350
|
+
" Entry.Id := NumberSequence.Next('WS_COUNT_SEQ');\n"
|
|
1351
|
+
" Entry.Insert(false); // Batchable — no identity return needed\n\n"
|
|
1352
|
+
"HINT: Insert 10 000 rows into both tables in SQL Profiler. "
|
|
1353
|
+
"AutoIncrement table: 10 000 individual INSERT statements. "
|
|
1354
|
+
"Manual key table: ~10 batch INSERT statements total."
|
|
1355
|
+
),
|
|
1356
|
+
exercises=[36],
|
|
1357
|
+
)
|
|
1358
|
+
class PatternAutoIncrementBulkInsert:
|
|
1359
|
+
_RE = re.compile(r'AutoIncrement\s*=\s*true', re.IGNORECASE)
|
|
1360
|
+
|
|
1361
|
+
@staticmethod
|
|
1362
|
+
def detect(text: str) -> list[dict]:
|
|
1363
|
+
return _findings(
|
|
1364
|
+
text,
|
|
1365
|
+
PatternAutoIncrementBulkInsert._RE,
|
|
1366
|
+
lambda m: (
|
|
1367
|
+
"AutoIncrement = true requires SCOPE_IDENTITY() per INSERT — prevents SQL batch inserts. "
|
|
1368
|
+
"Remove AutoIncrement and use NumberSequence.Next() for PK assignment."
|
|
1369
|
+
),
|
|
1370
|
+
)
|
|
1371
|
+
|
|
1372
|
+
@staticmethod
|
|
1373
|
+
def fix(text: str) -> str:
|
|
1374
|
+
return text # Requires table redesign + code change — no auto-fix
|
|
1375
|
+
|
|
1376
|
+
|
|
1377
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1378
|
+
# PATTERN 38 — AL-side GROUP BY aggregation (Ex 43)
|
|
1379
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1380
|
+
@_register(
|
|
1381
|
+
id="AL_SIDE_AGGREGATION",
|
|
1382
|
+
group="Aggregation",
|
|
1383
|
+
severity="HIGH",
|
|
1384
|
+
title="AL-side GROUP BY aggregation — push to SQL with a Query object",
|
|
1385
|
+
description=(
|
|
1386
|
+
"Manual AL aggregation: FindSet fetches ALL rows into NST, accumulates sums per group in AL. "
|
|
1387
|
+
"For 100 000 entries — 100 000 rows transferred to NST memory. "
|
|
1388
|
+
"A Query object with Method = Sum pushes GROUP BY and SUM() to SQL Server. "
|
|
1389
|
+
"SQL returns only N rows (one per group) — 99 990 rows never leave the database.\n\n"
|
|
1390
|
+
"SQL IMPACT: AL loop: SELECT all 100 000 rows, SUM in NST memory.\n"
|
|
1391
|
+
"Query: SELECT Location, SUM(Amount) GROUP BY Location → 10 rows only.\n\n"
|
|
1392
|
+
"BAD: if WorkshopData.FindSet() then repeat\n"
|
|
1393
|
+
" TotalByLocation.Add(WorkshopData.\"Location Code\", WorkshopData.Amount);\n"
|
|
1394
|
+
" until WorkshopData.Next() = 0;\n"
|
|
1395
|
+
"GOOD: var RevenueQuery: Query \"WS Location Revenue\";\n"
|
|
1396
|
+
" if RevenueQuery.Open() then\n"
|
|
1397
|
+
" while RevenueQuery.Read() do\n"
|
|
1398
|
+
" ProcessSummary(RevenueQuery.Location_Code, RevenueQuery.Sum_Line_Amount);\n\n"
|
|
1399
|
+
"HINT: Run the manual loop on 50 000 rows. Check SQL Profiler: count SELECT rows returned. "
|
|
1400
|
+
"Then switch to the Query version. Profiler shows 1 query returning only N rows. "
|
|
1401
|
+
"Duration difference is dramatic at scale."
|
|
1402
|
+
),
|
|
1403
|
+
exercises=[43],
|
|
1404
|
+
)
|
|
1405
|
+
class PatternAlSideAggregation:
|
|
1406
|
+
# Detect FindSet loop that accumulates into a Dictionary by group key
|
|
1407
|
+
_RE = re.compile(
|
|
1408
|
+
r'FindSet\s*\([^)]*\).*?repeat.*?\.Add\s*\(',
|
|
1409
|
+
re.IGNORECASE | re.DOTALL,
|
|
1410
|
+
)
|
|
1411
|
+
|
|
1412
|
+
@staticmethod
|
|
1413
|
+
def detect(text: str) -> list[dict]:
|
|
1414
|
+
findings = []
|
|
1415
|
+
for m in PatternAlSideAggregation._RE.finditer(text):
|
|
1416
|
+
line = _find_line(text, m.start())
|
|
1417
|
+
snippet = text[m.start(): m.start() + 80].split('\n')[0].strip()
|
|
1418
|
+
findings.append({
|
|
1419
|
+
"line": line,
|
|
1420
|
+
"message": (
|
|
1421
|
+
"AL-side GROUP BY aggregation — fetches all rows to NST. "
|
|
1422
|
+
"Use a Query object with Method = Sum to push GROUP BY to SQL Server."
|
|
1423
|
+
),
|
|
1424
|
+
"snippet": snippet,
|
|
1425
|
+
})
|
|
1426
|
+
return findings
|
|
1427
|
+
|
|
1428
|
+
@staticmethod
|
|
1429
|
+
def fix(text: str) -> str:
|
|
1430
|
+
return text # Structural change required — no auto-fix
|
|
1431
|
+
|
|
1432
|
+
|
|
1433
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1434
|
+
# Utility helpers
|
|
1435
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1436
|
+
|
|
1437
|
+
def _scan_file(path: Path) -> list[dict]:
|
|
1438
|
+
"""Run all detectors on a single AL file. Returns list of finding dicts."""
|
|
1439
|
+
try:
|
|
1440
|
+
text = path.read_text(encoding='utf-8-sig')
|
|
1441
|
+
except Exception as e:
|
|
1442
|
+
return [{"pattern": "READ_ERROR", "file": str(path), "line": 0, "snippet": str(e), "message": "Could not read file"}]
|
|
1443
|
+
|
|
1444
|
+
findings = []
|
|
1445
|
+
for p in PATTERNS:
|
|
1446
|
+
for f in p["detector"](text):
|
|
1447
|
+
findings.append({
|
|
1448
|
+
"pattern": p["id"],
|
|
1449
|
+
"severity": p["severity"],
|
|
1450
|
+
"title": p["title"],
|
|
1451
|
+
"file": str(path),
|
|
1452
|
+
**f
|
|
1453
|
+
})
|
|
1454
|
+
return findings
|
|
1455
|
+
|
|
1456
|
+
|
|
1457
|
+
def _fix_file(path: Path) -> tuple[str, list[str]]:
|
|
1458
|
+
"""Apply all fixers to a single AL file. Returns (new_text, list_of_applied_fixes)."""
|
|
1459
|
+
try:
|
|
1460
|
+
text = path.read_text(encoding='utf-8-sig')
|
|
1461
|
+
except Exception as e:
|
|
1462
|
+
return "", [f"READ_ERROR: {e}"]
|
|
1463
|
+
|
|
1464
|
+
applied = []
|
|
1465
|
+
original = text
|
|
1466
|
+
for p in PATTERNS:
|
|
1467
|
+
new_text = p["fixer"](text)
|
|
1468
|
+
if new_text != text:
|
|
1469
|
+
applied.append(p["id"])
|
|
1470
|
+
text = new_text
|
|
1471
|
+
|
|
1472
|
+
return text, applied
|
|
1473
|
+
|
|
1474
|
+
|
|
1475
|
+
def _al_files(folder: Path) -> list[Path]:
|
|
1476
|
+
return sorted(folder.rglob("*.al"))
|
|
1477
|
+
|
|
1478
|
+
|
|
1479
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1480
|
+
# MCP Tools
|
|
1481
|
+
# ───────────────────────────────────────────────────────────────────────
|
|
1482
|
+
|
|
1483
|
+
@mcp.tool()
|
|
1484
|
+
def list_patterns() -> str:
|
|
1485
|
+
"""
|
|
1486
|
+
List all known AL performance anti-patterns with IDs, severity, and short descriptions.
|
|
1487
|
+
Use this to understand what the analyzer can detect before running a scan.
|
|
1488
|
+
"""
|
|
1489
|
+
lines = ["# AL Performance Patterns\n"]
|
|
1490
|
+
groups: dict[str, list] = {}
|
|
1491
|
+
for p in PATTERNS:
|
|
1492
|
+
groups.setdefault(p["group"], []).append(p)
|
|
1493
|
+
|
|
1494
|
+
for group, items in sorted(groups.items()):
|
|
1495
|
+
lines.append(f"\n## {group}\n")
|
|
1496
|
+
for p in items:
|
|
1497
|
+
lines.append(f"- **[{p['severity']}]** `{p['id']}` \n {p['title']} \n Exercises: {p['exercises']}\n")
|
|
1498
|
+
|
|
1499
|
+
return "\n".join(lines)
|
|
1500
|
+
|
|
1501
|
+
|
|
1502
|
+
@mcp.tool()
|
|
1503
|
+
def explain_pattern(pattern_id: str) -> str:
|
|
1504
|
+
"""
|
|
1505
|
+
Get a full explanation of a specific performance pattern including examples and the fix.
|
|
1506
|
+
|
|
1507
|
+
Args:
|
|
1508
|
+
pattern_id: The pattern ID (e.g. 'MISSING_SETLOADFIELDS'). Use list_patterns() to see all IDs.
|
|
1509
|
+
"""
|
|
1510
|
+
for p in PATTERNS:
|
|
1511
|
+
if p["id"].upper() == pattern_id.upper():
|
|
1512
|
+
return (
|
|
1513
|
+
f"# {p['title']}\n\n"
|
|
1514
|
+
f"**ID:** `{p['id']}` \n"
|
|
1515
|
+
f"**Severity:** {p['severity']} \n"
|
|
1516
|
+
f"**Category:** {p['group']} \n"
|
|
1517
|
+
f"**Workshop Exercises:** {p['exercises']}\n\n"
|
|
1518
|
+
f"{p['description']}"
|
|
1519
|
+
)
|
|
1520
|
+
ids = ", ".join(p["id"] for p in PATTERNS)
|
|
1521
|
+
return f"Pattern '{pattern_id}' not found. Known IDs: {ids}"
|
|
1522
|
+
|
|
1523
|
+
|
|
1524
|
+
@mcp.tool()
|
|
1525
|
+
def scan_al_workspace(
|
|
1526
|
+
folder_path: str,
|
|
1527
|
+
severity_filter: str = "ALL",
|
|
1528
|
+
group_filter: str = "ALL",
|
|
1529
|
+
) -> str:
|
|
1530
|
+
"""
|
|
1531
|
+
Scan all AL files in a folder (recursively) for performance anti-patterns.
|
|
1532
|
+
Returns a structured report of findings grouped by file.
|
|
1533
|
+
|
|
1534
|
+
Args:
|
|
1535
|
+
folder_path: Absolute path to the folder containing AL source files.
|
|
1536
|
+
severity_filter: Filter by severity: HIGH, MEDIUM, LOW, or ALL (default ALL).
|
|
1537
|
+
group_filter: Filter by pattern group name or ALL (default ALL).
|
|
1538
|
+
"""
|
|
1539
|
+
folder = Path(folder_path)
|
|
1540
|
+
if not folder.exists():
|
|
1541
|
+
return f"ERROR: Folder not found: {folder_path}"
|
|
1542
|
+
|
|
1543
|
+
files = _al_files(folder)
|
|
1544
|
+
if not files:
|
|
1545
|
+
return f"No .al files found in {folder_path}"
|
|
1546
|
+
|
|
1547
|
+
all_findings: list[dict] = []
|
|
1548
|
+
for f in files:
|
|
1549
|
+
all_findings.extend(_scan_file(f))
|
|
1550
|
+
|
|
1551
|
+
# Apply filters
|
|
1552
|
+
if severity_filter.upper() != "ALL":
|
|
1553
|
+
all_findings = [f for f in all_findings if f["severity"].upper() == severity_filter.upper()]
|
|
1554
|
+
if group_filter.upper() != "ALL":
|
|
1555
|
+
all_findings = [f for f in all_findings if
|
|
1556
|
+
any(p["group"].upper() == group_filter.upper()
|
|
1557
|
+
for p in PATTERNS if p["id"] == f["pattern"])]
|
|
1558
|
+
|
|
1559
|
+
if not all_findings:
|
|
1560
|
+
return f"✅ No issues found ({len(files)} files scanned)."
|
|
1561
|
+
|
|
1562
|
+
# Group by file
|
|
1563
|
+
by_file: dict[str, list] = {}
|
|
1564
|
+
for f in all_findings:
|
|
1565
|
+
by_file.setdefault(f["file"], []).append(f)
|
|
1566
|
+
|
|
1567
|
+
severity_order = {"HIGH": 0, "MEDIUM": 1, "LOW": 2}
|
|
1568
|
+
total = len(all_findings)
|
|
1569
|
+
high = sum(1 for f in all_findings if f["severity"] == "HIGH")
|
|
1570
|
+
medium = sum(1 for f in all_findings if f["severity"] == "MEDIUM")
|
|
1571
|
+
low = sum(1 for f in all_findings if f["severity"] == "LOW")
|
|
1572
|
+
|
|
1573
|
+
lines = [
|
|
1574
|
+
f"# AL Performance Scan Results\n",
|
|
1575
|
+
f"**Folder:** `{folder_path}` ",
|
|
1576
|
+
f"**Files scanned:** {len(files)} ",
|
|
1577
|
+
f"**Issues found:** {total} ({high} HIGH, {medium} MEDIUM, {low} LOW)\n",
|
|
1578
|
+
]
|
|
1579
|
+
|
|
1580
|
+
for filepath, findings in sorted(by_file.items()):
|
|
1581
|
+
rel = Path(filepath).relative_to(folder) if Path(filepath).is_relative_to(folder) else Path(filepath).name
|
|
1582
|
+
lines.append(f"\n## `{rel}`\n")
|
|
1583
|
+
findings_sorted = sorted(findings, key=lambda x: severity_order.get(x["severity"], 9))
|
|
1584
|
+
for f in findings_sorted:
|
|
1585
|
+
sev_icon = {"HIGH": "🔴", "MEDIUM": "🟡", "LOW": "🔵"}.get(f["severity"], "⚪")
|
|
1586
|
+
lines.append(f"- {sev_icon} **L{f['line']}** `{f['pattern']}`: {f['message']}")
|
|
1587
|
+
if f.get("snippet"):
|
|
1588
|
+
lines.append(f" ```al\n {f['snippet']}\n ```")
|
|
1589
|
+
|
|
1590
|
+
return "\n".join(lines)
|
|
1591
|
+
|
|
1592
|
+
|
|
1593
|
+
@mcp.tool()
|
|
1594
|
+
def fix_al_file(
|
|
1595
|
+
file_path: str,
|
|
1596
|
+
dry_run: bool = True,
|
|
1597
|
+
) -> str:
|
|
1598
|
+
"""
|
|
1599
|
+
Apply all available automatic fixes to a single AL file.
|
|
1600
|
+
|
|
1601
|
+
Args:
|
|
1602
|
+
file_path: Absolute path to the .al file to fix.
|
|
1603
|
+
dry_run: If True (default), show what would change without writing. Set False to write.
|
|
1604
|
+
"""
|
|
1605
|
+
path = Path(file_path)
|
|
1606
|
+
if not path.exists():
|
|
1607
|
+
return f"ERROR: File not found: {file_path}"
|
|
1608
|
+
|
|
1609
|
+
original = path.read_text(encoding='utf-8-sig')
|
|
1610
|
+
new_text, applied = _fix_file(path)
|
|
1611
|
+
|
|
1612
|
+
if not applied:
|
|
1613
|
+
return f"✅ No automatic fixes applicable to `{path.name}`."
|
|
1614
|
+
|
|
1615
|
+
lines = [f"# Fix Report: `{path.name}`\n"]
|
|
1616
|
+
lines.append(f"**Fixes applied:** {', '.join(applied)}\n")
|
|
1617
|
+
|
|
1618
|
+
if dry_run:
|
|
1619
|
+
lines.append("**Mode:** DRY RUN — no file written. Set dry_run=False to apply.\n")
|
|
1620
|
+
# Show diff summary
|
|
1621
|
+
orig_lines = original.splitlines()
|
|
1622
|
+
new_lines = new_text.splitlines()
|
|
1623
|
+
changes = 0
|
|
1624
|
+
for i, (o, n) in enumerate(zip(orig_lines, new_lines)):
|
|
1625
|
+
if o != n:
|
|
1626
|
+
lines.append(f"L{i+1}: `{o.strip()}` → `{n.strip()}`")
|
|
1627
|
+
changes += 1
|
|
1628
|
+
if changes >= 20:
|
|
1629
|
+
lines.append(f"... (and more)")
|
|
1630
|
+
break
|
|
1631
|
+
else:
|
|
1632
|
+
path.write_text(new_text, encoding='utf-8-sig')
|
|
1633
|
+
lines.append(f"✅ File written: `{file_path}`")
|
|
1634
|
+
|
|
1635
|
+
return "\n".join(lines)
|
|
1636
|
+
|
|
1637
|
+
|
|
1638
|
+
@mcp.tool()
|
|
1639
|
+
def fix_al_workspace(
|
|
1640
|
+
folder_path: str,
|
|
1641
|
+
dry_run: bool = True,
|
|
1642
|
+
) -> str:
|
|
1643
|
+
"""
|
|
1644
|
+
Apply all available automatic fixes to every AL file in a folder (recursively).
|
|
1645
|
+
|
|
1646
|
+
Args:
|
|
1647
|
+
folder_path: Absolute path to the folder containing AL source files.
|
|
1648
|
+
dry_run: If True (default), show what would change without writing. Set False to write.
|
|
1649
|
+
"""
|
|
1650
|
+
folder = Path(folder_path)
|
|
1651
|
+
if not folder.exists():
|
|
1652
|
+
return f"ERROR: Folder not found: {folder_path}"
|
|
1653
|
+
|
|
1654
|
+
files = _al_files(folder)
|
|
1655
|
+
if not files:
|
|
1656
|
+
return f"No .al files found in {folder_path}"
|
|
1657
|
+
|
|
1658
|
+
results = []
|
|
1659
|
+
total_fixes = 0
|
|
1660
|
+
for f in files:
|
|
1661
|
+
original = f.read_text(encoding='utf-8-sig')
|
|
1662
|
+
new_text, applied = _fix_file(f)
|
|
1663
|
+
if applied:
|
|
1664
|
+
total_fixes += len(applied)
|
|
1665
|
+
results.append((f, applied, original != new_text))
|
|
1666
|
+
if not dry_run and original != new_text:
|
|
1667
|
+
f.write_text(new_text, encoding='utf-8-sig')
|
|
1668
|
+
|
|
1669
|
+
if not results:
|
|
1670
|
+
return f"✅ No automatic fixes applicable in {len(files)} files."
|
|
1671
|
+
|
|
1672
|
+
mode = "DRY RUN" if dry_run else "APPLIED"
|
|
1673
|
+
lines = [
|
|
1674
|
+
f"# Fix Workspace Report [{mode}]\n",
|
|
1675
|
+
f"**Folder:** `{folder_path}` ",
|
|
1676
|
+
f"**Files with fixes:** {len(results)} of {len(files)} ",
|
|
1677
|
+
f"**Total fix operations:** {total_fixes}\n",
|
|
1678
|
+
]
|
|
1679
|
+
|
|
1680
|
+
for f, applied, changed in results:
|
|
1681
|
+
rel = f.relative_to(folder) if f.is_relative_to(folder) else f.name
|
|
1682
|
+
status = "✅ written" if (not dry_run and changed) else ("📝 would change" if changed else "⟳ no change")
|
|
1683
|
+
lines.append(f"- `{rel}` [{status}]: {', '.join(applied)}")
|
|
1684
|
+
|
|
1685
|
+
if dry_run:
|
|
1686
|
+
lines.append("\n> Set `dry_run=False` to apply all changes.")
|
|
1687
|
+
|
|
1688
|
+
return "\n".join(lines)
|
|
1689
|
+
|
|
1690
|
+
|
|
1691
|
+
@mcp.tool()
|
|
1692
|
+
def scan_al_code(
|
|
1693
|
+
al_code: str,
|
|
1694
|
+
file_hint: str = "inline",
|
|
1695
|
+
) -> str:
|
|
1696
|
+
"""
|
|
1697
|
+
Scan a snippet of AL code (pasted inline) for performance issues.
|
|
1698
|
+
Useful for checking code before committing or during code review.
|
|
1699
|
+
|
|
1700
|
+
Args:
|
|
1701
|
+
al_code: The AL code text to analyze.
|
|
1702
|
+
file_hint: Optional label for the code (e.g. the procedure name).
|
|
1703
|
+
"""
|
|
1704
|
+
findings: list[dict] = []
|
|
1705
|
+
for p in PATTERNS:
|
|
1706
|
+
for f in p["detector"](al_code):
|
|
1707
|
+
findings.append({
|
|
1708
|
+
"pattern": p["id"],
|
|
1709
|
+
"severity": p["severity"],
|
|
1710
|
+
"title": p["title"],
|
|
1711
|
+
"file": file_hint,
|
|
1712
|
+
**f
|
|
1713
|
+
})
|
|
1714
|
+
|
|
1715
|
+
if not findings:
|
|
1716
|
+
return "✅ No performance issues detected in the provided code."
|
|
1717
|
+
|
|
1718
|
+
severity_order = {"HIGH": 0, "MEDIUM": 1, "LOW": 2}
|
|
1719
|
+
findings_sorted = sorted(findings, key=lambda x: severity_order.get(x["severity"], 9))
|
|
1720
|
+
|
|
1721
|
+
lines = [f"# Performance Issues in `{file_hint}`\n"]
|
|
1722
|
+
for f in findings_sorted:
|
|
1723
|
+
sev_icon = {"HIGH": "🔴", "MEDIUM": "🟡", "LOW": "🔵"}.get(f["severity"], "⚪")
|
|
1724
|
+
lines.append(f"{sev_icon} **L{f['line']}** `{f['pattern']}` — {f['message']}")
|
|
1725
|
+
lines.append(f" > {f['title']}")
|
|
1726
|
+
if f.get("snippet"):
|
|
1727
|
+
lines.append(f" ```al\n {f['snippet']}\n ```")
|
|
1728
|
+
lines.append("")
|
|
1729
|
+
|
|
1730
|
+
return "\n".join(lines)
|
|
1731
|
+
|
|
1732
|
+
|
|
1733
|
+
# ═══════════════════════════════════════════════════════════════════════
|
|
1734
|
+
# ORCHESTRATION LAYER
|
|
1735
|
+
# ═══════════════════════════════════════════════════════════════════════
|
|
1736
|
+
#
|
|
1737
|
+
# Architecture:
|
|
1738
|
+
# analyze_al_performance(folder) ← master orchestrator
|
|
1739
|
+
# internally delegates to one function per pattern group (sub-agents)
|
|
1740
|
+
# aggregates all results into a unified priority report
|
|
1741
|
+
#
|
|
1742
|
+
# Individual group sub-agent tools also exposed so the LLM can call
|
|
1743
|
+
# them independently when the user asks about a specific category.
|
|
1744
|
+
#
|
|
1745
|
+
# ═══════════════════════════════════════════════════════════════════════
|
|
1746
|
+
|
|
1747
|
+
# ─── Internal sub-agent runner ────────────────────────────────────────
|
|
1748
|
+
|
|
1749
|
+
def _run_group_agent(group_name: str, folder: Path) -> dict:
|
|
1750
|
+
"""
|
|
1751
|
+
Run all detectors belonging to a single pattern group against every AL file.
|
|
1752
|
+
Returns a structured result dict — this is what each sub-agent produces.
|
|
1753
|
+
"""
|
|
1754
|
+
group_patterns = [p for p in PATTERNS if p["group"] == group_name]
|
|
1755
|
+
files = _al_files(folder)
|
|
1756
|
+
|
|
1757
|
+
findings: list[dict] = []
|
|
1758
|
+
for f in files:
|
|
1759
|
+
try:
|
|
1760
|
+
text = f.read_text(encoding="utf-8-sig")
|
|
1761
|
+
except Exception:
|
|
1762
|
+
continue
|
|
1763
|
+
for p in group_patterns:
|
|
1764
|
+
for finding in p["detector"](text):
|
|
1765
|
+
findings.append({
|
|
1766
|
+
"pattern": p["id"],
|
|
1767
|
+
"severity": p["severity"],
|
|
1768
|
+
"title": p["title"],
|
|
1769
|
+
"file": str(f),
|
|
1770
|
+
"rel_file": str(f.relative_to(folder)) if f.is_relative_to(folder) else f.name,
|
|
1771
|
+
**finding
|
|
1772
|
+
})
|
|
1773
|
+
|
|
1774
|
+
high = [f for f in findings if f["severity"] == "HIGH"]
|
|
1775
|
+
medium = [f for f in findings if f["severity"] == "MEDIUM"]
|
|
1776
|
+
low = [f for f in findings if f["severity"] == "LOW"]
|
|
1777
|
+
|
|
1778
|
+
# Auto-fixable patterns in this group
|
|
1779
|
+
fixable = [p["id"] for p in group_patterns if _is_pattern_auto_fixable(p["id"])]
|
|
1780
|
+
|
|
1781
|
+
return {
|
|
1782
|
+
"group": group_name,
|
|
1783
|
+
"patterns_checked": [p["id"] for p in group_patterns],
|
|
1784
|
+
"files_scanned": len(files),
|
|
1785
|
+
"total": len(findings),
|
|
1786
|
+
"high": len(high),
|
|
1787
|
+
"medium": len(medium),
|
|
1788
|
+
"low": len(low),
|
|
1789
|
+
"fixable_patterns": fixable,
|
|
1790
|
+
"findings": findings,
|
|
1791
|
+
}
|
|
1792
|
+
|
|
1793
|
+
|
|
1794
|
+
_AUTO_FIXABLE = {
|
|
1795
|
+
"FIND_DASH_BUFFER_ONE",
|
|
1796
|
+
"COUNT_NOT_ZERO",
|
|
1797
|
+
"COUNT_EQUALS_ONE",
|
|
1798
|
+
"ISEMPTY_BEFORE_FINDSET",
|
|
1799
|
+
"FINDSET_BEFORE_MODIFYALL",
|
|
1800
|
+
"FINDSET_BEFORE_DELETEALL",
|
|
1801
|
+
"MODIFYALL_RUNTRIGGER_TRUE",
|
|
1802
|
+
"MISSING_TEMPORARY",
|
|
1803
|
+
"FINDSET_MODIFY_NO_TRUE",
|
|
1804
|
+
"LOCKTABLE_USE_UPDLOCK",
|
|
1805
|
+
"FINDFIRST_IN_LOOP",
|
|
1806
|
+
}
|
|
1807
|
+
|
|
1808
|
+
def _is_pattern_auto_fixable(pattern_id: str) -> bool:
|
|
1809
|
+
return pattern_id in _AUTO_FIXABLE
|
|
1810
|
+
|
|
1811
|
+
|
|
1812
|
+
def _format_group_report(result: dict, folder: Path, detail_level: str = "summary") -> list[str]:
|
|
1813
|
+
"""Render one group sub-agent result as markdown lines."""
|
|
1814
|
+
sev_icon = "🔴" if result["high"] > 0 else ("🟡" if result["medium"] > 0 else "✅")
|
|
1815
|
+
lines = [
|
|
1816
|
+
f"\n### {sev_icon} {result['group']}",
|
|
1817
|
+
f"Found **{result['total']}** issue(s) — "
|
|
1818
|
+
f"{result['high']} HIGH, {result['medium']} MEDIUM, {result['low']} LOW",
|
|
1819
|
+
]
|
|
1820
|
+
if result["fixable_patterns"]:
|
|
1821
|
+
lines.append(f"Auto-fixable patterns: `{'`, `'.join(result['fixable_patterns'])}`")
|
|
1822
|
+
|
|
1823
|
+
if detail_level != "full" or result["total"] == 0:
|
|
1824
|
+
return lines
|
|
1825
|
+
|
|
1826
|
+
severity_order = {"HIGH": 0, "MEDIUM": 1, "LOW": 2}
|
|
1827
|
+
findings_sorted = sorted(result["findings"], key=lambda x: severity_order.get(x["severity"], 9))
|
|
1828
|
+
seen: set[str] = set()
|
|
1829
|
+
for f in findings_sorted[:15]: # cap per group
|
|
1830
|
+
key = f"{f['rel_file']}:{f['line']}:{f['pattern']}"
|
|
1831
|
+
if key in seen:
|
|
1832
|
+
continue
|
|
1833
|
+
seen.add(key)
|
|
1834
|
+
icon = {"HIGH": "🔴", "MEDIUM": "🟡", "LOW": "🔵"}.get(f["severity"], "⚪")
|
|
1835
|
+
lines.append(f" - {icon} `{f['rel_file']}` L{f['line']} `{f['pattern']}`: {f['message']}")
|
|
1836
|
+
if len(result["findings"]) > 15:
|
|
1837
|
+
lines.append(f" - _(… {len(result['findings']) - 15} more — use group sub-agent for full list)_")
|
|
1838
|
+
return lines
|
|
1839
|
+
|
|
1840
|
+
|
|
1841
|
+
# ─── Group sub-agent tools ────────────────────────────────────────────
|
|
1842
|
+
# Each exposed as its own MCP tool so the LLM can call them independently.
|
|
1843
|
+
|
|
1844
|
+
def _group_tool_impl(group_name: str, folder_path: str) -> str:
|
|
1845
|
+
folder = Path(folder_path)
|
|
1846
|
+
if not folder.exists():
|
|
1847
|
+
return f"ERROR: Folder not found: {folder_path}"
|
|
1848
|
+
result = _run_group_agent(group_name, folder)
|
|
1849
|
+
lines = [f"# Sub-Agent: {group_name}\n",
|
|
1850
|
+
f"**Folder:** `{folder_path}` ",
|
|
1851
|
+
f"**Issues:** {result['total']} ({result['high']} HIGH, {result['medium']} MEDIUM, {result['low']} LOW)\n"]
|
|
1852
|
+
lines += _format_group_report(result, folder, detail_level="full")
|
|
1853
|
+
return "\n".join(lines)
|
|
1854
|
+
|
|
1855
|
+
|
|
1856
|
+
@mcp.tool()
|
|
1857
|
+
def scan_data_transfer_issues(folder_path: str) -> str:
|
|
1858
|
+
"""
|
|
1859
|
+
Sub-agent: Scan for Data Transfer anti-patterns.
|
|
1860
|
+
Covers: missing SetLoadFields, Find('-') buffer-size-1, FindFirst in loops, FindLast in loops,
|
|
1861
|
+
SetRange+FindFirst instead of Get, SetCurrentKey missing.
|
|
1862
|
+
"""
|
|
1863
|
+
return _group_tool_impl("Data Transfer", folder_path)
|
|
1864
|
+
|
|
1865
|
+
|
|
1866
|
+
@mcp.tool()
|
|
1867
|
+
def scan_flowfield_issues(folder_path: str) -> str:
|
|
1868
|
+
"""
|
|
1869
|
+
Sub-agent: Scan for FlowField anti-patterns.
|
|
1870
|
+
Covers: CalcFields inside loops, SetFilter on FlowField (correlated subquery).
|
|
1871
|
+
"""
|
|
1872
|
+
return _group_tool_impl("FlowFields", folder_path)
|
|
1873
|
+
|
|
1874
|
+
|
|
1875
|
+
@mcp.tool()
|
|
1876
|
+
def scan_aggregation_issues(folder_path: str) -> str:
|
|
1877
|
+
"""
|
|
1878
|
+
Sub-agent: Scan for Aggregation anti-patterns.
|
|
1879
|
+
Covers: manual summation loops that should use CalcSums().
|
|
1880
|
+
"""
|
|
1881
|
+
return _group_tool_impl("Aggregation", folder_path)
|
|
1882
|
+
|
|
1883
|
+
|
|
1884
|
+
@mcp.tool()
|
|
1885
|
+
def scan_bulk_operation_issues(folder_path: str) -> str:
|
|
1886
|
+
"""
|
|
1887
|
+
Sub-agent: Scan for Bulk Operation anti-patterns.
|
|
1888
|
+
Covers: Delete in loop, FindSet before ModifyAll, FindSet before DeleteAll,
|
|
1889
|
+
ModifyAll with RunTrigger=true.
|
|
1890
|
+
"""
|
|
1891
|
+
return _group_tool_impl("Bulk Operations", folder_path)
|
|
1892
|
+
|
|
1893
|
+
|
|
1894
|
+
@mcp.tool()
|
|
1895
|
+
def scan_existence_check_issues(folder_path: str) -> str:
|
|
1896
|
+
"""
|
|
1897
|
+
Sub-agent: Scan for Existence Check anti-patterns.
|
|
1898
|
+
Covers: Count() != 0 vs IsEmpty(), redundant IsEmpty before FindSet, Count() = 1 uniqueness.
|
|
1899
|
+
"""
|
|
1900
|
+
return _group_tool_impl("Existence Checks", folder_path)
|
|
1901
|
+
|
|
1902
|
+
|
|
1903
|
+
@mcp.tool()
|
|
1904
|
+
def scan_locking_issues(folder_path: str) -> str:
|
|
1905
|
+
"""
|
|
1906
|
+
Sub-agent: Scan for Locking anti-patterns.
|
|
1907
|
+
Covers: LockTable too early, LockTable for sequence generation, DeleteAll without IsEmpty guard,
|
|
1908
|
+
LockTable vs ReadIsolation UpdLock.
|
|
1909
|
+
"""
|
|
1910
|
+
return _group_tool_impl("Locking", folder_path)
|
|
1911
|
+
|
|
1912
|
+
|
|
1913
|
+
@mcp.tool()
|
|
1914
|
+
def scan_memory_issues(folder_path: str) -> str:
|
|
1915
|
+
"""
|
|
1916
|
+
Sub-agent: Scan for Memory / Copy anti-patterns.
|
|
1917
|
+
Covers: Record parameter by value, missing 'temporary' keyword, temp table used as Dictionary,
|
|
1918
|
+
temp table used as collection, RecordRef when typed Record suffices.
|
|
1919
|
+
"""
|
|
1920
|
+
return _group_tool_impl("Memory / Copies", folder_path)
|
|
1921
|
+
|
|
1922
|
+
|
|
1923
|
+
@mcp.tool()
|
|
1924
|
+
def scan_short_circuit_issues(folder_path: str) -> str:
|
|
1925
|
+
"""
|
|
1926
|
+
Sub-agent: Scan for Short-Circuit Evaluation anti-patterns.
|
|
1927
|
+
Covers: OR/AND eager evaluation, 3+ OR conditions (use case true of),
|
|
1928
|
+
'if true in [...]' condition ordering.
|
|
1929
|
+
"""
|
|
1930
|
+
return _group_tool_impl("Short-Circuit Evaluation", folder_path)
|
|
1931
|
+
|
|
1932
|
+
|
|
1933
|
+
@mcp.tool()
|
|
1934
|
+
def scan_write_pattern_issues(folder_path: str) -> str:
|
|
1935
|
+
"""
|
|
1936
|
+
Sub-agent: Scan for Write Pattern anti-patterns.
|
|
1937
|
+
Covers: Insert-on-conflict (try Insert, Modify on fail), silent Insert failure.
|
|
1938
|
+
"""
|
|
1939
|
+
return _group_tool_impl("Write Patterns", folder_path)
|
|
1940
|
+
|
|
1941
|
+
|
|
1942
|
+
@mcp.tool()
|
|
1943
|
+
def scan_cursor_safety_issues(folder_path: str) -> str:
|
|
1944
|
+
"""
|
|
1945
|
+
Sub-agent: Scan for Cursor Safety anti-patterns.
|
|
1946
|
+
Covers: SetRange/SetFilter on active FindSet cursor (corrupts iteration),
|
|
1947
|
+
FindSet(true) missing when Modify is called on cursor variable.
|
|
1948
|
+
"""
|
|
1949
|
+
# Combine Cursor Safety + the FindSet(true) pattern
|
|
1950
|
+
return _group_tool_impl("Cursor Safety", folder_path)
|
|
1951
|
+
|
|
1952
|
+
|
|
1953
|
+
@mcp.tool()
|
|
1954
|
+
def scan_stale_read_issues(folder_path: str) -> str:
|
|
1955
|
+
"""
|
|
1956
|
+
Sub-agent: Scan for Stale Read anti-patterns.
|
|
1957
|
+
Covers: missing ReadIsolation on reporting queries, missing SelectLatestVersion in multi-pass loops.
|
|
1958
|
+
"""
|
|
1959
|
+
return _group_tool_impl("Stale Reads", folder_path)
|
|
1960
|
+
|
|
1961
|
+
|
|
1962
|
+
# ─── Master orchestrator tool ─────────────────────────────────────────
|
|
1963
|
+
|
|
1964
|
+
@mcp.tool()
|
|
1965
|
+
def analyze_al_performance(
|
|
1966
|
+
folder_path: str,
|
|
1967
|
+
include_action_plan: bool = True,
|
|
1968
|
+
) -> str:
|
|
1969
|
+
"""
|
|
1970
|
+
MASTER ORCHESTRATOR — runs all pattern-group sub-agents in sequence and produces
|
|
1971
|
+
a unified performance report with a prioritized action plan.
|
|
1972
|
+
|
|
1973
|
+
This is the primary entry point. It:
|
|
1974
|
+
1. Delegates to each pattern-group sub-agent (Data Transfer, FlowFields, Locking, etc.)
|
|
1975
|
+
2. Aggregates all findings across all groups
|
|
1976
|
+
3. Ranks files by total issue severity score
|
|
1977
|
+
4. Produces a prioritized action plan: which files to fix first and how
|
|
1978
|
+
5. Lists all auto-fixable patterns with the fix command to run
|
|
1979
|
+
|
|
1980
|
+
Args:
|
|
1981
|
+
folder_path: Absolute path to the AL workspace folder to analyze.
|
|
1982
|
+
include_action_plan: Include the prioritized fix plan (default True).
|
|
1983
|
+
"""
|
|
1984
|
+
folder = Path(folder_path)
|
|
1985
|
+
if not folder.exists():
|
|
1986
|
+
return f"ERROR: Folder not found: {folder_path}"
|
|
1987
|
+
|
|
1988
|
+
files = _al_files(folder)
|
|
1989
|
+
if not files:
|
|
1990
|
+
return f"No .al files found in {folder_path}"
|
|
1991
|
+
|
|
1992
|
+
# ── Step 1: Collect all unique group names from the pattern registry ──
|
|
1993
|
+
all_groups = sorted({p["group"] for p in PATTERNS})
|
|
1994
|
+
|
|
1995
|
+
# ── Step 2: Run each group sub-agent ──────────────────────────────────
|
|
1996
|
+
group_results: list[dict] = []
|
|
1997
|
+
for group in all_groups:
|
|
1998
|
+
result = _run_group_agent(group, folder)
|
|
1999
|
+
group_results.append(result)
|
|
2000
|
+
|
|
2001
|
+
# ── Step 3: Aggregate ─────────────────────────────────────────────────
|
|
2002
|
+
all_findings: list[dict] = []
|
|
2003
|
+
for r in group_results:
|
|
2004
|
+
all_findings.extend(r["findings"])
|
|
2005
|
+
|
|
2006
|
+
total = len(all_findings)
|
|
2007
|
+
high = sum(1 for f in all_findings if f["severity"] == "HIGH")
|
|
2008
|
+
medium = sum(1 for f in all_findings if f["severity"] == "MEDIUM")
|
|
2009
|
+
low = sum(1 for f in all_findings if f["severity"] == "LOW")
|
|
2010
|
+
score = high * 10 + medium * 3 + low # weighted severity score
|
|
2011
|
+
|
|
2012
|
+
# Files ranked by severity score
|
|
2013
|
+
file_scores: dict[str, dict] = {}
|
|
2014
|
+
for f in all_findings:
|
|
2015
|
+
fp = f["file"]
|
|
2016
|
+
if fp not in file_scores:
|
|
2017
|
+
file_scores[fp] = {"high": 0, "medium": 0, "low": 0, "patterns": set(), "rel": f["rel_file"]}
|
|
2018
|
+
file_scores[fp][f["severity"].lower()] += 1
|
|
2019
|
+
file_scores[fp]["patterns"].add(f["pattern"])
|
|
2020
|
+
|
|
2021
|
+
ranked_files = sorted(
|
|
2022
|
+
file_scores.items(),
|
|
2023
|
+
key=lambda x: x[1]["high"] * 10 + x[1]["medium"] * 3 + x[1]["low"],
|
|
2024
|
+
reverse=True
|
|
2025
|
+
)
|
|
2026
|
+
|
|
2027
|
+
# Auto-fixable findings
|
|
2028
|
+
fixable_findings = [f for f in all_findings if _is_pattern_auto_fixable(f["pattern"])]
|
|
2029
|
+
fixable_count = len(fixable_findings)
|
|
2030
|
+
fixable_files = sorted({f["rel_file"] for f in fixable_findings})
|
|
2031
|
+
|
|
2032
|
+
# ── Step 4: Build report ──────────────────────────────────────────────
|
|
2033
|
+
lines = [
|
|
2034
|
+
"# 🔍 AL Performance Analysis — Orchestrator Report\n",
|
|
2035
|
+
f"**Workspace:** `{folder_path}` ",
|
|
2036
|
+
f"**Files scanned:** {len(files)} ",
|
|
2037
|
+
f"**Total issues:** {total} (🔴 {high} HIGH, 🟡 {medium} MEDIUM, 🔵 {low} LOW) ",
|
|
2038
|
+
f"**Severity score:** {score} ",
|
|
2039
|
+
f"**Auto-fixable:** {fixable_count} issues in {len(fixable_files)} files\n",
|
|
2040
|
+
"---\n",
|
|
2041
|
+
"## Sub-Agent Results by Group\n",
|
|
2042
|
+
"| Group | HIGH | MED | LOW | Total |",
|
|
2043
|
+
"|-------|------|-----|-----|-------|",
|
|
2044
|
+
]
|
|
2045
|
+
for r in group_results:
|
|
2046
|
+
status = "🔴" if r["high"] > 0 else ("🟡" if r["medium"] > 0 else "✅")
|
|
2047
|
+
lines.append(f"| {status} {r['group']} | {r['high']} | {r['medium']} | {r['low']} | {r['total']} |")
|
|
2048
|
+
|
|
2049
|
+
# ── Top offending files ───────────────────────────────────────────────
|
|
2050
|
+
lines += ["\n---\n", "## 🏆 Files Ranked by Severity Score\n"]
|
|
2051
|
+
for i, (fp, sc) in enumerate(ranked_files[:10], 1):
|
|
2052
|
+
file_score = sc["high"] * 10 + sc["medium"] * 3 + sc["low"]
|
|
2053
|
+
patterns_str = ", ".join(f"`{p}`" for p in sorted(sc["patterns"]))
|
|
2054
|
+
lines.append(
|
|
2055
|
+
f"{i}. **`{sc['rel']}`** — score {file_score} "
|
|
2056
|
+
f"(🔴{sc['high']} 🟡{sc['medium']} 🔵{sc['low']}) \n"
|
|
2057
|
+
f" Patterns: {patterns_str}"
|
|
2058
|
+
)
|
|
2059
|
+
if len(ranked_files) > 10:
|
|
2060
|
+
lines.append(f"\n_… and {len(ranked_files) - 10} more files with issues._")
|
|
2061
|
+
|
|
2062
|
+
# ── Action plan ───────────────────────────────────────────────────────
|
|
2063
|
+
if include_action_plan:
|
|
2064
|
+
lines += ["\n---\n", "## 📋 Prioritized Action Plan\n"]
|
|
2065
|
+
|
|
2066
|
+
# Phase 1: Auto-fixable
|
|
2067
|
+
if fixable_findings:
|
|
2068
|
+
lines.append("### Phase 1 — Run Automatic Fixes (zero manual effort)")
|
|
2069
|
+
lines.append(f"These {fixable_count} issues can be fixed instantly with `fix_al_workspace`:")
|
|
2070
|
+
for pid in sorted(_AUTO_FIXABLE):
|
|
2071
|
+
count = sum(1 for f in all_findings if f["pattern"] == pid)
|
|
2072
|
+
if count > 0:
|
|
2073
|
+
title = next((p["title"] for p in PATTERNS if p["id"] == pid), pid)
|
|
2074
|
+
lines.append(f" - `{pid}` × {count} — {title}")
|
|
2075
|
+
lines.append(f"\n> **Run:** `fix_al_workspace(\"{folder_path}\", dry_run=False)`")
|
|
2076
|
+
|
|
2077
|
+
# Phase 2: High severity manual fixes
|
|
2078
|
+
high_manual = [f for f in all_findings if f["severity"] == "HIGH" and not _is_pattern_auto_fixable(f["pattern"])]
|
|
2079
|
+
if high_manual:
|
|
2080
|
+
lines.append("\n### Phase 2 — High Severity (manual code changes required)")
|
|
2081
|
+
by_pattern: dict[str, list] = {}
|
|
2082
|
+
for f in high_manual:
|
|
2083
|
+
by_pattern.setdefault(f["pattern"], []).append(f)
|
|
2084
|
+
for pid, findings in sorted(by_pattern.items(), key=lambda x: -len(x[1])):
|
|
2085
|
+
title = next((p["title"] for p in PATTERNS if p["id"] == pid), pid)
|
|
2086
|
+
files_affected = sorted({f["rel_file"] for f in findings})
|
|
2087
|
+
lines.append(f"\n**`{pid}`** × {len(findings)} — {title}")
|
|
2088
|
+
lines.append(f" Files: {', '.join(f'`{f}`' for f in files_affected[:5])}")
|
|
2089
|
+
lines.append(f" > Run `explain_pattern(\"{pid}\")` for the fix pattern")
|
|
2090
|
+
|
|
2091
|
+
# Phase 3: Medium
|
|
2092
|
+
medium_manual = [f for f in all_findings if f["severity"] == "MEDIUM" and not _is_pattern_auto_fixable(f["pattern"])]
|
|
2093
|
+
if medium_manual:
|
|
2094
|
+
by_pattern2: dict[str, int] = {}
|
|
2095
|
+
for f in medium_manual:
|
|
2096
|
+
by_pattern2[f["pattern"]] = by_pattern2.get(f["pattern"], 0) + 1
|
|
2097
|
+
lines.append("\n### Phase 3 — Medium Severity")
|
|
2098
|
+
for pid, count in sorted(by_pattern2.items(), key=lambda x: -x[1]):
|
|
2099
|
+
title = next((p["title"] for p in PATTERNS if p["id"] == pid), pid)
|
|
2100
|
+
lines.append(f" - `{pid}` × {count} — {title}")
|
|
2101
|
+
|
|
2102
|
+
# Drill-down hints
|
|
2103
|
+
lines += [
|
|
2104
|
+
"\n---\n",
|
|
2105
|
+
"## 🔬 Drill Down with Sub-Agents\n",
|
|
2106
|
+
"Call these tools for a full per-file breakdown of each category:\n",
|
|
2107
|
+
]
|
|
2108
|
+
group_tool_map = {
|
|
2109
|
+
"Data Transfer": "scan_data_transfer_issues",
|
|
2110
|
+
"FlowFields": "scan_flowfield_issues",
|
|
2111
|
+
"Aggregation": "scan_aggregation_issues",
|
|
2112
|
+
"Bulk Operations": "scan_bulk_operation_issues",
|
|
2113
|
+
"Existence Checks": "scan_existence_check_issues",
|
|
2114
|
+
"Locking": "scan_locking_issues",
|
|
2115
|
+
"Memory / Copies": "scan_memory_issues",
|
|
2116
|
+
"Short-Circuit Evaluation": "scan_short_circuit_issues",
|
|
2117
|
+
"Write Patterns": "scan_write_pattern_issues",
|
|
2118
|
+
"Cursor Safety": "scan_cursor_safety_issues",
|
|
2119
|
+
"Stale Reads": "scan_stale_read_issues",
|
|
2120
|
+
"Sort / Keys": "scan_data_transfer_issues", # covered by data transfer
|
|
2121
|
+
}
|
|
2122
|
+
for r in group_results:
|
|
2123
|
+
if r["total"] > 0:
|
|
2124
|
+
tool = group_tool_map.get(r["group"], "scan_al_workspace")
|
|
2125
|
+
lines.append(f"- **{r['group']}** ({r['total']} issues) → `{tool}(\"{folder_path}\")`")
|
|
2126
|
+
|
|
2127
|
+
return "\n".join(lines)
|
|
2128
|
+
|
|
2129
|
+
|
|
2130
|
+
if __name__ == "__main__":
|
|
2131
|
+
mcp.run()
|