npm - vision-electronic-indexing-pi - Versions diffs - 0.1.3 → 0.1.4 - Mend

vision-electronic-indexing-pi 0.1.3 → 0.1.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (7) hide show

package/.pi/extensions/vision-inventory-mcp/README.md +2 -2
package/.pi/extensions/vision-inventory-mcp/index.ts +2 -2
package/.pi/skills/vision-inventory-workflow/SKILL.md +1 -1
package/README.md +5 -5
package/package.json +1 -1
package/scripts/inventory_folder_to_csv.py +9 -8
package/vision_inventory_mcp.py +6 -5

package/.pi/extensions/vision-inventory-mcp/README.md CHANGED Viewed

@@ -60,7 +60,7 @@ The agent workflow:
 - `/vision-inventory-agent-bom` runs the full agent-assisted datasheet-enrichment workflow.
 - `/vision-inventory-restart` restarts the local Python vision bridge.
-Options are forwarded to `scripts/inventory_folder_to_csv.py`, such as `--recursive`, `--limit`, `--max-side`, and `--jpeg-quality`.
+Options are forwarded to `scripts/inventory_folder_to_csv.py`, such as `--recursive`, `--limit`, `--max-side`, and `--jpeg-quality`. The default `--max-side 0` sends images at full resolution; set a value of at least 256 to downscale larger images (non-zero values below 256 are rejected).
 ## Agent tools
@@ -81,7 +81,7 @@ This package intentionally does **not** bundle:
 The main output is `inventory.csv`, with columns:
 ```text
-normalized_part
+likely_part
 candidate_parts
 amount
 sighting_count

package/.pi/extensions/vision-inventory-mcp/index.ts CHANGED Viewed

@@ -362,7 +362,7 @@ export default function (pi: ExtensionAPI) {
     ],
     parameters: Type.Object({
       image_path: Type.String({ description: "Path to the image file, relative to the project root or absolute." }),
-      max_side: Type.Optional(Type.Integer({ description: "Maximum resized image side before submission.", default: 4000 })),
+      max_side: Type.Optional(Type.Integer({ description: "Maximum resized image side before submission. Use 0 for full resolution.", default: 0 })),
       jpeg_quality: Type.Optional(Type.Integer({ description: "JPEG conversion quality from 1 to 100.", default: 96 })),
       custom_prompt: Type.Optional(Type.String({ description: "Optional custom analysis prompt." })),
     }),
@@ -383,7 +383,7 @@ export default function (pi: ExtensionAPI) {
     parameters: Type.Object({
       folder_path: Type.String({ description: "Folder path, relative to the project root or absolute." }),
       recursive: Type.Optional(Type.Boolean({ description: "Whether to scan subfolders.", default: false })),
-      max_side: Type.Optional(Type.Integer({ description: "Maximum resized image side before submission.", default: 4000 })),
+      max_side: Type.Optional(Type.Integer({ description: "Maximum resized image side before submission. Use 0 for full resolution.", default: 0 })),
       jpeg_quality: Type.Optional(Type.Integer({ description: "JPEG conversion quality from 1 to 100.", default: 96 })),
       limit: Type.Optional(Type.Integer({ description: "Optional maximum number of images to process." })),
     }),

package/.pi/skills/vision-inventory-workflow/SKILL.md CHANGED Viewed

@@ -23,7 +23,7 @@ Use `/vision-inventory-setup` to configure credentials and check/install Python
 /vision-inventory-agent-bom <image_folder> <output_dir> [options]
 ```
-Options are forwarded to `scripts/inventory_folder_to_csv.py`, for example `--recursive`, `--limit 3`, `--max-side 4000`, and `--jpeg-quality 96`.
+Options are forwarded to `scripts/inventory_folder_to_csv.py`, for example `--recursive`, `--limit 3`, `--max-side 0`, and `--jpeg-quality 96`. `--max-side 0` means full resolution and is the default.
 ## Agent Rules

package/README.md CHANGED Viewed

@@ -99,7 +99,7 @@ Useful options:
 ```text
 /vision-inventory-agent-bom ./photos ./output --recursive
 /vision-inventory-agent-bom ./photos ./output --limit 3
-/vision-inventory-agent-bom ./photos ./output --max-side 4000 --jpeg-quality 96
+/vision-inventory-agent-bom ./photos ./output --max-side 0 --jpeg-quality 96
 ```
 The agent workflow will:
@@ -135,13 +135,13 @@ verified=false
 ## CSV output columns
-`inventory.csv` is deduplicated by normalized part number. Multiple images, or multiple candidates from one image, can merge into one BOM row.
+`inventory.csv` is deduplicated by `likely_part`, the main/final part number column. Multiple images, or multiple candidates from one image, can merge into one BOM row when they resolve to the same `likely_part`.
 Columns:
 | Column | Description |
 |---|---|
-| `normalized_part` | Final normalized part number, usually from datasheet enrichment. |
+| `likely_part` | Deduplication key and final likely part number: the normalized part number from datasheet enrichment when available, otherwise the candidate part, trimmed and uppercased. |
 | `candidate_parts` | Candidate part numbers extracted from visual markings. |
 | `amount` | Estimated quantity for the merged BOM row. |
 | `sighting_count` | Number of evidence rows merged into this BOM row. |
@@ -242,7 +242,7 @@ Before sending an image to Cloudflare Workers AI, the Python server:
 1. Opens the image with Pillow.
 2. Applies EXIF orientation correction.
-3. Resizes only if the image is larger than `max_side`.
+3. Sends full resolution by default; resizes only when `max_side` is set to a non-zero value (minimum 256) and the image is larger than that limit.
 4. Converts transparency to a white background.
 5. Converts the image to RGB.
 6. Encodes it as JPEG.
@@ -251,7 +251,7 @@ Before sending an image to Cloudflare Workers AI, the Python server:
 Defaults:
 ```text
-max_side: 4000
+max_side: 0 (full resolution)
 jpeg_quality: 96
 model: @cf/meta/llama-4-scout-17b-16e-instruct
 ```

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "vision-electronic-indexing-pi",
-  "version": "0.1.3",
+  "version": "0.1.4",
   "description": "Pi package for agent-assisted electronics/PCB image inventory with Cloudflare Workers AI vision and datasheet enrichment.",
   "license": "MIT",
   "repository": {

package/scripts/inventory_folder_to_csv.py CHANGED Viewed

@@ -261,7 +261,7 @@ def image_part_rows(results: List[Dict[str, Any]], cache: Dict[str, Any]) -> Lis
             rows.append({
                 "image": image_name,
                 "candidate_part": "",
-                "normalized_part": "",
+                "likely_part": "",
                 "amount": 0,
                 "description": "",
                 "datasheet_url": "",
@@ -286,6 +286,7 @@ def image_part_rows(results: List[Dict[str, Any]], cache: Dict[str, Any]) -> Lis
         for candidate, candidate_evidence in sorted(evidence_by_candidate.items()):
             enrichment = lookup_enrichment(candidate, cache)
+            likely_part = str(enrichment.get("normalized_part") or candidate).strip().upper()
             amount = estimate_amount_for_candidate(result, candidate, evidence_count=len(candidate_evidence))
             observed_markings = sorted({row["observed_marking"] for row in candidate_evidence})
             observations = "; ".join(
@@ -298,7 +299,7 @@ def image_part_rows(results: List[Dict[str, Any]], cache: Dict[str, Any]) -> Lis
             rows.append({
                 "image": image_name,
                 "candidate_part": candidate,
-                "normalized_part": enrichment.get("normalized_part", candidate),
+                "likely_part": likely_part,
                 "amount": amount,
                 "description": enrichment.get("description", ""),
                 "datasheet_url": enrichment.get("datasheet_url", ""),
@@ -328,7 +329,7 @@ def write_final_csv(results: List[Dict[str, Any]], cache: Dict[str, Any], output
     evidence_fieldnames = [
         "image",
         "candidate_part",
-        "normalized_part",
+        "likely_part",
         "amount",
         "description",
         "datasheet_url",
@@ -345,7 +346,7 @@ def write_final_csv(results: List[Dict[str, Any]], cache: Dict[str, Any], output
     grouped: Dict[str, List[Dict[str, Any]]] = defaultdict(list)
     no_part_rows: List[Dict[str, Any]] = []
     for row in evidence_rows:
-        part = str(row.get("normalized_part") or row.get("candidate_part") or "").strip().upper()
+        part = str(row.get("likely_part") or row.get("candidate_part") or "").strip().upper()
         if not part:
             no_part_rows.append(row)
         else:
@@ -362,7 +363,7 @@ def write_final_csv(results: List[Dict[str, Any]], cache: Dict[str, Any], output
         amount = sum(int(row.get("amount", 0) or 0) for row in rows_for_part)
         bom_rows.append({
-            "normalized_part": part,
+            "likely_part": part,
             "candidate_parts": " | ".join(sorted({str(row["candidate_part"]) for row in rows_for_part if row.get("candidate_part")})),
             "amount": amount,
             "sighting_count": len(rows_for_part),
@@ -380,7 +381,7 @@ def write_final_csv(results: List[Dict[str, Any]], cache: Dict[str, Any], output
     for row in no_part_rows:
         bom_rows.append({
-            "normalized_part": "",
+            "likely_part": "",
             "candidate_parts": "",
             "amount": 0,
             "sighting_count": 1,
@@ -397,7 +398,7 @@ def write_final_csv(results: List[Dict[str, Any]], cache: Dict[str, Any], output
         })
     bom_fieldnames = [
-        "normalized_part",
+        "likely_part",
         "candidate_parts",
         "amount",
         "sighting_count",
@@ -424,7 +425,7 @@ def parse_args() -> argparse.Namespace:
     parser.add_argument("--recursive", action="store_true", help="Scan image_folder recursively")
     parser.add_argument("--limit", type=int, default=None, help="Maximum number of images to process")
     parser.add_argument("--skip-vision", action="store_true", help="Reuse existing output_dir/raw/*.json instead of calling vision AI")
-    parser.add_argument("--max-side", type=int, default=vision.DEFAULT_MAX_SIDE, help="Maximum resized image side")
+    parser.add_argument("--max-side", type=int, default=vision.DEFAULT_MAX_SIDE, help="Maximum resized image side; use 0 for full resolution (default)")
     parser.add_argument("--jpeg-quality", type=int, default=vision.DEFAULT_JPEG_QUALITY, help="JPEG quality for model input")
     return parser.parse_args()

package/vision_inventory_mcp.py CHANGED Viewed

@@ -56,7 +56,7 @@ except ImportError:  # pragma: no cover - compatibility fallback
 DEFAULT_MODEL = os.getenv("WORKERS_AI_MODEL", "@cf/meta/llama-4-scout-17b-16e-instruct")
-DEFAULT_MAX_SIDE = 4000
+DEFAULT_MAX_SIDE = 0
 DEFAULT_JPEG_QUALITY = 96
 DEFAULT_MAX_TOKENS = 1600
 DEFAULT_TEMPERATURE = 0.05
@@ -184,8 +184,8 @@ def prepare_image_data_url(
     max_side: int = DEFAULT_MAX_SIDE,
     jpeg_quality: int = DEFAULT_JPEG_QUALITY,
 ) -> Tuple[Optional[str], Optional[Dict[str, Any]]]:
-    if max_side < 256:
-        return None, error_response("max_side must be at least 256.")
+    if max_side and max_side < 256:
+        return None, error_response("max_side must be 0 for full resolution or at least 256.")
     if jpeg_quality < 1 or jpeg_quality > 100:
         return None, error_response("jpeg_quality must be between 1 and 100.")
@@ -194,8 +194,9 @@ def prepare_image_data_url(
         image = Image.open(image_path)
         image = ImageOps.exif_transpose(image)
-        resample = getattr(Image, "Resampling", Image).LANCZOS
-        image.thumbnail((max_side, max_side), resample)
+        if max_side:
+            resample = getattr(Image, "Resampling", Image).LANCZOS
+            image.thumbnail((max_side, max_side), resample)
         # Convert transparency to white background before JPEG encoding.
         if image.mode in ("RGBA", "LA"):