PyPI - Semapp - Versions diffs - 1.0.5__py3-none-any.whl - Mend

Semapp 1.0.5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (27) hide show

semapp/Layout/__init__.py +26 -0
semapp/Layout/create_button.py +1248 -0
semapp/Layout/main_window_att.py +54 -0
semapp/Layout/settings.py +170 -0
semapp/Layout/styles.py +152 -0
semapp/Layout/toast.py +157 -0
semapp/Plot/__init__.py +8 -0
semapp/Plot/frame_attributes.py +690 -0
semapp/Plot/overview_window.py +355 -0
semapp/Plot/styles.py +55 -0
semapp/Plot/utils.py +295 -0
semapp/Processing/__init__.py +4 -0
semapp/Processing/detection.py +513 -0
semapp/Processing/klarf_reader.py +461 -0
semapp/Processing/processing.py +686 -0
semapp/Processing/rename_tif.py +498 -0
semapp/Processing/split_tif.py +323 -0
semapp/Processing/threshold.py +777 -0
semapp/__init__.py +10 -0
semapp/asset/icon.png +0 -0
semapp/main.py +103 -0
semapp-1.0.5.dist-info/METADATA +300 -0
semapp-1.0.5.dist-info/RECORD +27 -0
semapp-1.0.5.dist-info/WHEEL +5 -0
semapp-1.0.5.dist-info/entry_points.txt +2 -0
semapp-1.0.5.dist-info/licenses/LICENSE +674 -0
semapp-1.0.5.dist-info/top_level.txt +1 -0

semapp/Processing/processing.py ADDED Viewed

@@ -0,0 +1,686 @@
+"""
+Module for processing and renaming TIFF files based on coordinates read from KLARF (.001) files.
+"""
+import json
+import re
+import glob
+import shutil
+import os
+from PIL import Image
+import pandas as pd
+from semapp.Processing.klarf_reader import extract_positions
+from semapp.Processing.rename_tif import rename_files, rename_files_all
+from semapp.Processing.split_tif import split_tiff, split_tiff_all
+class Process:
+    """
+    A class to handle processing of TIFF files and renaming them based on
+    coordinates from KLARF files.
+    This class supports three modes:
+    - Normal mode: Standard KLARF format with subdirectories
+    - COMPLUS4T mode: Multi-wafer KLARF files in parent directory
+    - KRONOS mode: Special format with OCR-based number detection
+    """
+    def __init__(self, dirname, wafer=None, scale=None):
+        """
+        Set up a processor bound to one base directory and, optionally, one wafer.
+        Args:
+            dirname (str): Base directory that holds the files.
+            wafer (int, optional): Wafer number. It is stored as its string
+                form, so the default None is kept as the text "None".
+            scale (str, optional): Path of the settings JSON file read by
+                load_json(). Defaults to None.
+        """
+        # Results that the processing methods fill in later.
+        self.tiff_path = self.coordinates = self.output_dir = None
+        self.settings = None
+        # Inputs supplied by the caller.
+        self.wafer_number = str(wafer)
+        self.scale_data = scale
+        self.dirname = dirname
+        # Populate self.settings (an empty list when no file is given).
+        self.load_json()
+    def load_json(self):
+        """
+        Load the settings list from the JSON file named by self.scale_data.
+        The file is expected to hold a list of dictionaries carrying
+        'Scale' and 'Image Type' keys. self.settings falls back to an
+        empty list when no path was given, when the file is missing or
+        unreadable, when it is not valid UTF-8 JSON, or when its
+        top-level value is not a list.
+        """
+        self.settings = []
+        if not self.scale_data:
+            return
+        try:
+            with open(self.scale_data, "r", encoding="utf-8") as file:
+                loaded = json.load(file)
+        except (OSError, ValueError):
+            # OSError covers missing/unreadable files; ValueError covers both
+            # json.JSONDecodeError and UnicodeDecodeError (undecodable bytes).
+            return
+        # rename()/rename_all() iterate the settings as a list of dicts, so
+        # any other top-level JSON value is treated as invalid.
+        if isinstance(loaded, list):
+            self.settings = loaded
+    def extract_positions(self, filepath):
+        """
+        Read defect positions from a KLARF file through the klarf_reader module.
+        The stored wafer number is converted to an integer wafer id when
+        that is possible; otherwise no wafer id (None) is passed on.
+        The result is also kept on self.coordinates.
+        Args:
+            filepath (str): Path to the KLARF (.001) file
+        Returns:
+            The value returned by klarf_reader.extract_positions for the
+            file; callers in this class treat it as a pandas DataFrame.
+        """
+        raw_wafer = self.wafer_number
+        selected_wafer = None
+        # A falsy value or the literal text "None" means "no wafer selected".
+        if raw_wafer and raw_wafer != "None":
+            try:
+                selected_wafer = int(raw_wafer)
+            except (ValueError, TypeError):
+                selected_wafer = None
+        positions = extract_positions(filepath, wafer_id=selected_wafer)
+        self.coordinates = positions
+        return positions
+    def rename(self):
+        """
+        Rename the selected wafer's TIFF files using KLARF coordinates.
+        The KLARF (.001) file is looked up according to the detected mode:
+        - COMPLUS4T mode: the file in the base directory that lists the
+          selected wafer ID; coordinates are extracted for that wafer only
+        - Normal/KRONOS mode: the first .001 file found in the wafer
+          subdirectory; coordinates are extracted without a wafer filter
+        Nothing is renamed when the settings contain a duplicated
+        scale/image-type pair, when the wafer subdirectory does not exist,
+        or when no suitable .001 file is found (this includes a COMPLUS4T
+        run whose wafer number is not an integer).
+        The renaming itself is delegated to rename_tif.rename_files.
+        """
+        print("\n" + "="*80)
+        print("[DEBUG] rename() called")
+        print(f"[DEBUG] dirname: {self.dirname}")
+        print(f"[DEBUG] wafer_number: {self.wafer_number}")
+        print("="*80)
+        # Safety check: refuse to run when two settings entries share the
+        # same scale/image-type pair.
+        seen = set()
+        duplicate_combinations = []
+        for setting in self.settings:
+            combination = f"{setting['Scale']}_{setting['Image Type']}"
+            if combination in seen:
+                duplicate_combinations.append(combination)
+            else:
+                seen.add(combination)
+        if duplicate_combinations:
+            print(f"Warning: Duplicate scale/image_type combinations found: {duplicate_combinations}. "
+                  f"Skipping rename operation.")
+            return
+        self.output_dir = os.path.join(self.dirname, self.wafer_number)
+        print(f"[DEBUG] output_dir: {self.output_dir}")
+        if not os.path.exists(self.output_dir):
+            print("[DEBUG] output_dir does not exist, returning")
+            return
+        # COMPLUS4T mode keeps the .001 files in the base directory
+        is_complus4t = self._check_complus4t_mode()
+        print(f"[DEBUG] is_complus4t: {is_complus4t}")
+        recipe_path = None
+        if is_complus4t:
+            matching_files = glob.glob(os.path.join(self.dirname, '*.001'))
+            print(f"[DEBUG] COMPLUS4T: Found {len(matching_files)} .001 files in parent directory")
+            # A wafer number such as "None" cannot match any WaferID entry;
+            # treat it as "no file found" instead of raising ValueError.
+            try:
+                wafer_id = int(self.wafer_number)
+            except (TypeError, ValueError):
+                wafer_id = None
+            if wafer_id is not None:
+                # Find the .001 file that contains the selected wafer ID
+                for file_path in matching_files:
+                    print(f"[DEBUG] Checking file: {os.path.basename(file_path)} for wafer {self.wafer_number}")
+                    if self._is_wafer_in_klarf(file_path, wafer_id):
+                        recipe_path = file_path
+                        print(f"[DEBUG] Found matching .001 file: {recipe_path}")
+                        break
+        else:
+            # Normal/KRONOS mode: .001 file is in wafer subdirectory
+            matching_files = glob.glob(os.path.join(self.output_dir, '*.001'))
+            print(f"[DEBUG] Normal/KRONOS: Found {len(matching_files)} .001 files in output_dir")
+            if matching_files:
+                recipe_path = matching_files[0]
+                print(f"[DEBUG] Using .001 file: {recipe_path}")
+        if not recipe_path:
+            print(f"[DEBUG] Warning: No .001 file found for wafer {self.wafer_number}")
+            return
+        # KRONOS detection only applies outside COMPLUS4T mode; the file is
+        # inspected once and the result reused below.
+        is_kronos = False if is_complus4t else self._check_kronos_mode(recipe_path)
+        print(f"[DEBUG] is_kronos: {is_kronos}")
+        original_wafer_number = self.wafer_number
+        if is_complus4t:
+            mode_label = "COMPLUS4T"
+            print(f"[DEBUG] COMPLUS4T: Setting wafer_number to {self.wafer_number} for extract_positions")
+        else:
+            mode_label = "Normal/KRONOS"
+            # No wafer filter, so extract_positions reads all defects
+            print("[DEBUG] Normal/KRONOS: Setting wafer_number to None for extract_positions")
+            self.wafer_number = None
+        try:
+            self.coordinates = self.extract_positions(recipe_path)
+        finally:
+            # Restore the selected wafer even if extraction raises
+            self.wafer_number = original_wafer_number
+        extracted = 0 if self.coordinates is None else len(self.coordinates)
+        print(f"[DEBUG] {mode_label}: Extracted {extracted} coordinates")
+        print(f"[DEBUG] Final is_kronos: {is_kronos}")
+        print("[DEBUG] Coordinates DataFrame:")
+        print(self.coordinates)
+        # Call the rename_tif module function
+        renamed_count = rename_files(
+            output_dir=self.output_dir,
+            coordinates=self.coordinates,
+            settings=self.settings,
+            is_kronos=is_kronos,
+            is_complus4t=is_complus4t
+        )
+        print(f"[DEBUG] Total files renamed: {renamed_count}")
+        print("="*80 + "\n")
+    def split_tiff(self):
+        """
+        Split the merged TIFF file of the selected wafer into individual files.
+        In COMPLUS4T mode the first '*.tiff' (or, failing that, '*.tif')
+        file of the base directory is used, and the wafer's coordinates
+        are extracted first from the .001 file that lists the wafer ID.
+        Otherwise 'data.tif' inside the wafer subdirectory is used and
+        KRONOS mode is detected from the first .001 file found there.
+        The splitting itself is delegated to split_tif.split_tiff.
+        Returns:
+            list: The value returned by split_tif.split_tiff, or an empty
+                list when, in COMPLUS4T mode, no TIFF file, no matching
+                .001 file (including a non-integer wafer number) or no
+                coordinates are found.
+        """
+        is_complus4t = self._check_complus4t_mode()
+        is_kronos = False
+        if is_complus4t:
+            # COMPLUS4T mode: TIFF file is in parent directory
+            tiff_files = (glob.glob(os.path.join(self.dirname, '*.tiff'))
+                          or glob.glob(os.path.join(self.dirname, '*.tif')))
+            if not tiff_files:
+                return []
+            self.tiff_path = tiff_files[0]  # Use first TIFF file found
+            # Output directory is the wafer subdirectory
+            output_dir = os.path.join(self.dirname, self.wafer_number)
+            # A wafer number such as "None" cannot match any WaferID entry;
+            # report it like a missing file instead of raising ValueError.
+            try:
+                wafer_id = int(self.wafer_number)
+            except (TypeError, ValueError):
+                wafer_id = None
+            recipe_path = None
+            if wafer_id is not None:
+                # Find the .001 file that contains the selected wafer ID
+                for file_path in glob.glob(os.path.join(self.dirname, '*.001')):
+                    if self._is_wafer_in_klarf(file_path, wafer_id):
+                        recipe_path = file_path
+                        break
+            if not recipe_path:
+                print(f"Warning: No .001 file found for wafer {self.wafer_number}")
+                return []
+            # Extract coordinates to get defect_id list
+            self.coordinates = self.extract_positions(recipe_path)
+            if self.coordinates is None or self.coordinates.empty:
+                print(f"Warning: No coordinates found for wafer {self.wafer_number}")
+                return []
+        else:
+            # Normal/KRONOS mode: TIFF file is in wafer subdirectory
+            output_dir = os.path.join(self.dirname, self.wafer_number)
+            self.tiff_path = os.path.join(output_dir, "data.tif")
+            self.coordinates = None  # Not needed for normal/KRONOS mode
+            # KRONOS is detected from the wafer subdirectory's first .001 file
+            matching_files = glob.glob(os.path.join(output_dir, '*.001'))
+            if matching_files:
+                is_kronos = self._check_kronos_mode(matching_files[0])
+        # Call the split_tif module function
+        output_files = split_tiff(
+            tiff_path=self.tiff_path,
+            output_dir=output_dir,
+            coordinates=self.coordinates,
+            is_kronos=is_kronos,
+            is_complus4t=is_complus4t
+        )
+        return output_files
+    def clean(self):
+        """
+        Delete non-conforming TIFF files from the selected wafer's directory.
+        Only regular files whose name ends in '.tif' or '.tiff'
+        (case-insensitive) are considered. Such a file is deleted when its
+        name does not start with "data" or contains "page"
+        (case-insensitive). Every other entry is left untouched, and
+        nothing happens when the wafer directory does not exist.
+        """
+        self.output_dir = os.path.join(self.dirname, self.wafer_number)
+        if not os.path.isdir(self.output_dir):
+            return
+        for file_name in os.listdir(self.output_dir):
+            lowered = file_name.lower()
+            if not lowered.endswith(('.tiff', '.tif')):
+                continue
+            file_path = os.path.join(self.output_dir, file_name)
+            if not os.path.isfile(file_path):
+                # os.remove() cannot delete a directory that is named like a TIFF
+                continue
+            if not file_name.startswith("data") or "page" in lowered:
+                os.remove(file_path)
+    def split_tiff_all(self):
+        """
+        Split the merged TIFF files of every wafer into individual files.
+        In COMPLUS4T mode, coordinates are first extracted for every
+        directory below the base directory whose name is an integer wafer
+        number. For each wafer the parent .001 file that lists its wafer
+        ID is used, falling back to the first .001 file found.
+        Otherwise KRONOS mode is detected from the first subdirectory
+        visited. The splitting itself is delegated to
+        split_tif.split_tiff_all.
+        Returns:
+            list: The value returned by split_tif.split_tiff_all, or an
+                empty list when COMPLUS4T mode has no .001 file to read.
+        """
+        is_complus4t = self._check_complus4t_mode()
+        coordinates_dict = None
+        is_kronos = False
+        if is_complus4t:
+            # COMPLUS4T mode: need to extract coordinates for all wafers
+            matching_files = glob.glob(os.path.join(self.dirname, '*.001'))
+            if not matching_files:
+                print("Warning: No .001 file found in parent directory for COMPLUS4T mode")
+                return []
+            coordinates_dict = {}
+            for subdir, _, _ in os.walk(self.dirname):
+                if subdir == self.dirname:
+                    continue
+                try:
+                    wafer_num = int(os.path.basename(subdir))
+                except ValueError:
+                    continue
+                # Prefer the file that lists this wafer, as split_tiff() does
+                recipe_path = next(
+                    (path for path in matching_files
+                     if self._is_wafer_in_klarf(path, wafer_num)),
+                    matching_files[0])
+                original_wafer_number = self.wafer_number
+                self.wafer_number = str(wafer_num)
+                try:
+                    coordinates = self.extract_positions(recipe_path)
+                finally:
+                    # Restore the selected wafer even if extraction raises
+                    self.wafer_number = original_wafer_number
+                if coordinates is not None and not coordinates.empty:
+                    coordinates_dict[wafer_num] = coordinates
+        else:
+            # Normal/KRONOS mode: check for KRONOS in first subdirectory
+            for subdir, _, _ in os.walk(self.dirname):
+                if subdir == self.dirname:
+                    continue
+                matching_files = glob.glob(os.path.join(subdir, '*.001'))
+                if matching_files:
+                    is_kronos = self._check_kronos_mode(matching_files[0])
+                break
+        # Call the split_tif module function
+        output_files = split_tiff_all(
+            dirname=self.dirname,
+            coordinates_dict=coordinates_dict,
+            is_kronos=is_kronos,
+            is_complus4t=is_complus4t
+        )
+        return output_files
+    def rename_all(self):
+        """
+        Rename the TIFF files of every wafer using KLARF coordinates.
+        Every directory below the base directory whose name is an integer
+        wafer number is processed:
+        - COMPLUS4T mode: coordinates come from the parent .001 file that
+          lists the wafer ID (falling back to the first .001 file found)
+        - Normal/KRONOS mode: coordinates come from the first .001 file
+          of the wafer subdirectory; wafers without one are skipped
+        Wafers with no coordinates are skipped. Nothing is renamed when
+        the settings contain a duplicated scale/image-type pair.
+        The is_kronos flag passed on is the one detected for the last
+        wafer subdirectory that had a .001 file.
+        The renaming itself is delegated to rename_tif.rename_files_all.
+        """
+        print("\n" + "="*80)
+        print("[DEBUG] rename_all() called")
+        print(f"[DEBUG] dirname: {self.dirname}")
+        print("="*80)
+        # Safety check: refuse to run when two settings entries share the
+        # same scale/image-type pair.
+        seen = set()
+        duplicate_combinations = []
+        for setting in self.settings:
+            combination = f"{setting['Scale']}_{setting['Image Type']}"
+            if combination in seen:
+                duplicate_combinations.append(combination)
+            else:
+                seen.add(combination)
+        if duplicate_combinations:
+            print(f"Warning: Duplicate scale/image_type combinations found: {duplicate_combinations}. "
+                  f"Skipping rename operation.")
+            return
+        # COMPLUS4T mode keeps the .001 files in the base directory
+        is_complus4t = self._check_complus4t_mode()
+        print(f"[DEBUG] is_complus4t: {is_complus4t}")
+        parent_recipes = []
+        if is_complus4t:
+            parent_recipes = glob.glob(os.path.join(self.dirname, '*.001'))
+            print(f"[DEBUG] COMPLUS4T: Found {len(parent_recipes)} .001 files in parent directory")
+            if not parent_recipes:
+                print("[DEBUG] Warning: No .001 file found in parent directory for COMPLUS4T mode")
+                return
+            print(f"[DEBUG] COMPLUS4T: Using parent recipe_path: {parent_recipes[0]}")
+        # Build coordinates dictionary for all wafers
+        coordinates_dict = {}
+        is_kronos = False
+        for subdir, _, _ in os.walk(self.dirname):
+            if subdir == self.dirname:
+                continue
+            # Nested directories are mapped back to a top-level path by name
+            output_dir = os.path.join(self.dirname, os.path.basename(subdir))
+            try:
+                wafer_num = int(os.path.basename(subdir))
+            except ValueError:
+                continue
+            print(f"\n[DEBUG] Processing subdirectory: {subdir}")
+            print(f"[DEBUG] output_dir: {output_dir}")
+            print(f"[DEBUG] Extracted wafer_num: {wafer_num}")
+            if is_complus4t:
+                # Prefer the parent file that lists this wafer, as rename() does
+                recipe_path = next(
+                    (path for path in parent_recipes
+                     if self._is_wafer_in_klarf(path, wafer_num)),
+                    parent_recipes[0])
+                print(f"[DEBUG] COMPLUS4T: Using recipe_path: {recipe_path} for wafer {wafer_num}")
+                wafer_filter = str(wafer_num)
+                print(f"[DEBUG] COMPLUS4T: Setting wafer_number to {wafer_filter} for extract_positions")
+            else:
+                # Normal/KRONOS mode: .001 file is in wafer subdirectory
+                matching_files = glob.glob(os.path.join(output_dir, '*.001'))
+                print(f"[DEBUG] Normal/KRONOS: Found {len(matching_files)} .001 files in output_dir")
+                if not matching_files:
+                    print(f"[DEBUG] No .001 file found in {output_dir}, skipping")
+                    continue
+                recipe_path = matching_files[0]
+                is_kronos = self._check_kronos_mode(recipe_path)
+                print(f"[DEBUG] is_kronos: {is_kronos}")
+                wafer_filter = None
+            original_wafer_number = self.wafer_number
+            self.wafer_number = wafer_filter
+            try:
+                coordinates = self.extract_positions(recipe_path)
+            finally:
+                # Restore the selected wafer even if extraction raises
+                self.wafer_number = original_wafer_number
+            # Count defensively: len(None) would raise before the check below
+            extracted = 0 if coordinates is None else len(coordinates)
+            if is_complus4t:
+                print(f"[DEBUG] COMPLUS4T: Extracted {extracted} coordinates for wafer {wafer_num}")
+            else:
+                print(f"[DEBUG] Normal/KRONOS: Extracted {extracted} coordinates")
+            if coordinates is None or coordinates.empty:
+                print(f"[DEBUG] Warning: Coordinates are None or empty for wafer {wafer_num}")
+                continue
+            coordinates_dict[wafer_num] = coordinates
+        # Call the rename_tif module function
+        total_renamed = rename_files_all(
+            dirname=self.dirname,
+            coordinates_dict=coordinates_dict,
+            settings=self.settings,
+            is_kronos=is_kronos,
+            is_complus4t=is_complus4t
+        )
+        print(f"\n[DEBUG] Total files renamed across all directories: {total_renamed}")
+        print("="*80 + "\n")
+    def clean_all(self):
+        """
+        Delete non-conforming TIFF files in every wafer subdirectory.
+        Each immediate subdirectory of the base directory is cleaned
+        (symbolic links to directories are not followed). In each one, a
+        regular '.tif'/'.tiff' file (case-insensitive) is deleted when its
+        name does not start with "data" or contains "page"
+        (case-insensitive). Nested directories and other entries are left
+        untouched. self.output_dir is left pointing at the last directory
+        processed.
+        """
+        if not self.dirname or not os.path.isdir(self.dirname):
+            return
+        try:
+            with os.scandir(self.dirname) as entries:
+                wafer_dirs = sorted(entry.name for entry in entries
+                                    if entry.is_dir(follow_symlinks=False))
+        except OSError:
+            # The base directory cannot be listed, so there is nothing to clean
+            return
+        for dir_name in wafer_dirs:
+            self.output_dir = os.path.join(self.dirname, dir_name)
+            for file_name in os.listdir(self.output_dir):
+                lowered = file_name.lower()
+                if not lowered.endswith(('.tiff', '.tif')):
+                    continue
+                file_path = os.path.join(self.output_dir, file_name)
+                if not os.path.isfile(file_path):
+                    # os.remove() cannot delete a directory named like a TIFF
+                    continue
+                if not file_name.startswith("data") or "page" in lowered:
+                    os.remove(file_path)
+    def organize_and_rename_files(self):
+        """
+        Sort the base directory's '.tif' and '.001' files into subfolders.
+        The subfolder name is the text after the last underscore of the
+        file name, up to the first dot. A '.tif' file is moved there as
+        'data.tif'; a '.001' file is moved there under its own name.
+        Entries that are not regular files, names without an underscore
+        and names that would give an empty subfolder name are left in
+        place.
+        When the base directory initially held neither subdirectories nor
+        '.tif' files, one subfolder per wafer ID reported by
+        extract_wafer_ids_from_klarf() is created instead.
+        """
+        if not os.path.exists(self.dirname):
+            return
+        # Snapshot of the directory taken before anything is moved
+        entries = os.listdir(self.dirname)
+        subdirs = [d for d in entries
+                   if os.path.isdir(os.path.join(self.dirname, d))]
+        tif_files = [f for f in entries
+                     if f.lower().endswith(".tif") and os.path.isfile(os.path.join(self.dirname, f))]
+        for file_name in entries:
+            lowered = file_name.lower()
+            is_tif = lowered.endswith(".tif")
+            if not is_tif and not lowered.endswith(".001"):
+                continue
+            source_path = os.path.join(self.dirname, file_name)
+            if not os.path.isfile(source_path):
+                # Never move a directory that merely carries a matching suffix
+                continue
+            parts = file_name.rsplit("_", 1)
+            if len(parts) < 2:
+                # Skip file with unexpected format
+                continue
+            # Use the last part (before extension) as the subfolder name
+            subfolder_name = parts[-1].split(".")[0]
+            if not subfolder_name:
+                # An empty name would resolve to the base directory itself
+                continue
+            subfolder_path = os.path.join(self.dirname, subfolder_name)
+            os.makedirs(subfolder_path, exist_ok=True)
+            # TIFF files are renamed to data.tif; KLARF files keep their name
+            target_name = "data.tif" if is_tif else file_name
+            shutil.move(source_path, os.path.join(subfolder_path, target_name))
+        # If no subdirectories and no .tif files, create folders from KLARF files
+        if not subdirs and not tif_files:
+            for wafer_id in self.extract_wafer_ids_from_klarf():
+                os.makedirs(os.path.join(self.dirname, str(wafer_id)), exist_ok=True)
+    def _check_complus4t_mode(self):
+        """Tell whether a .001 file directly inside self.dirname contains the text COMPLUS4T."""
+        base_dir = self.dirname
+        if not (base_dir and os.path.exists(base_dir)):
+            return False
+        for klarf_path in glob.glob(os.path.join(base_dir, '*.001')):
+            try:
+                with open(klarf_path, 'r', encoding='utf-8', errors='ignore') as handle:
+                    if 'COMPLUS4T' in handle.read():
+                        return True
+            except Exception:
+                # Candidates that cannot be read are skipped
+                continue
+        return False
+    def _check_kronos_mode(self, filepath=None):
+        """
+        Tell whether a KLARF file looks like a KRONOS file.
+        A file qualifies when any line contains the text KRONOS or a
+        WaferID of the form "Read Failed.<digits>". With a filepath only
+        that file is inspected; without one, every .001 file directly
+        inside self.dirname is inspected. Unreadable files are skipped.
+        """
+        if filepath:
+            candidates = [filepath]
+        elif self.dirname and os.path.exists(self.dirname):
+            candidates = glob.glob(os.path.join(self.dirname, '*.001'))
+        else:
+            return False
+        for klarf_path in candidates:
+            try:
+                with open(klarf_path, 'r', encoding='utf-8', errors='ignore') as handle:
+                    for text in handle:
+                        if 'KRONOS' in text or re.search(r'WaferID\s+"Read Failed\.(\d+)"', text):
+                            return True
+            except Exception:
+                pass
+        return False
+    def _is_wafer_in_klarf(self, file_path, wafer_id):
+        """
+        Tell whether a KLARF file lists the given wafer ID.
+        Lines are searched for the COMPLUS4T form WaferID "@<digits>";
+        only the first such entry on a line is compared with wafer_id.
+        A file that cannot be read counts as not listing the wafer.
+        """
+        try:
+            with open(file_path, 'r', encoding='utf-8', errors='ignore') as handle:
+                for text in handle:
+                    found = re.search(r'WaferID\s+"@(\d+)"', text)
+                    if found is None:
+                        continue
+                    if int(found.group(1)) == wafer_id:
+                        return True
+        except Exception:
+            return False
+        return False
+    def extract_wafer_ids_from_klarf(self):
+        """
+        Collect the wafer IDs listed in the base directory's COMPLUS4T KLARF files.
+        Only regular files ending in '.001' that contain the text
+        COMPLUS4T are read. Every WaferID "@<digits>" entry between 1 and
+        26 is collected once, in order of first appearance. Files or
+        directories that cannot be read are ignored.
+        Returns:
+            list: The wafer IDs as integers (empty when none are found).
+        """
+        found_ids = []
+        if not self.dirname:
+            return found_ids
+        wafer_pattern = r'WaferID\s+"@(\d+)"'
+        try:
+            for entry in os.listdir(self.dirname):
+                klarf_path = os.path.join(self.dirname, entry)
+                if not (entry.endswith('.001') and os.path.isfile(klarf_path)):
+                    continue
+                try:
+                    with open(klarf_path, 'r', encoding='utf-8', errors='ignore') as handle:
+                        text = handle.read()
+                    if 'COMPLUS4T' not in text:
+                        continue
+                    for number in re.findall(wafer_pattern, text):
+                        candidate = int(number)
+                        if 1 <= candidate <= 26 and candidate not in found_ids:
+                            found_ids.append(candidate)
+                except Exception:
+                    pass  # Error reading file
+        except Exception:
+            pass  # Error listing files
+        return found_ids
+if __name__ == "__main__":
+    # Developer scratch entry point: the paths below are hard-coded to one
+    # workstation and must be edited before running this module directly.
+    DIRNAME = r"C:\Users\TM273821\Desktop\SEM\D25S2039_200_MOS2_SIO2_API"
+    SCALE = r"C:\Users\TM273821\SEM\settings_data.json"
+    processor = Process(DIRNAME, wafer=18, scale=SCALE)
+    # Alternative steps, kept commented out; enable the one that is needed.
+    # processor.organize_and_rename_files()  # Move .tif/.001 files into subfolders
+    # processor.rename_wo_legend_all()  # NOTE(review): no such method is defined on Process in this file
+    # processor.rename_wo_legend()  # NOTE(review): no such method is defined on Process in this file
+    # processor.split_tiff_all()  # Split the merged TIFF files of every wafer
+    # processor.split_tiff()  # Split the merged TIFF file of the selected wafer
+    processor.rename_all()  # Rename the TIFF files of every wafer subdirectory