PyPI - halib - Versions diffs - 0.2.8__py3-none-any.whl → 0.2.10__py3-none-any.whl - Mend

halib 0.2.8__py3-none-any.whl → 0.2.10__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (8) hide show

halib/exp/core/base_exp.py +119 -140
halib/system/_list_pc.csv +6 -0
halib/system/path.py +31 -19
{halib-0.2.8.dist-info → halib-0.2.10.dist-info}/METADATA +2 -2
{halib-0.2.8.dist-info → halib-0.2.10.dist-info}/RECORD +8 -7
{halib-0.2.8.dist-info → halib-0.2.10.dist-info}/WHEEL +0 -0
{halib-0.2.8.dist-info → halib-0.2.10.dist-info}/licenses/LICENSE.txt +0 -0
{halib-0.2.8.dist-info → halib-0.2.10.dist-info}/top_level.txt +0 -0

halib/exp/core/base_exp.py CHANGED Viewed

@@ -1,168 +1,147 @@
-import os
-from rich.pretty import pprint
 from abc import ABC, abstractmethod
-from typing import List, Optional, TypeVar, Generic
-from abc import ABC, abstractmethod
-from dataclasses import dataclass
-from dataclass_wizard import YAMLWizard
-class NamedCfg(ABC):
-    """
-    Base class for named configurations.
-    All configurations should have a name.
-    """
-    @abstractmethod
-    def get_name(self):
-        """
-        Get the name of the configuration.
-        This method should be implemented in subclasses.
-        """
-        pass
-@dataclass
-class AutoNamedCfg(YAMLWizard, NamedCfg):
-    """
-    Mixin that automatically implements get_name() by returning self.name.
-    Classes using this MUST have a 'name' field.
-    """
-    name: Optional[str] = None
-    def get_name(self):
-        return self.name
-    def __post_init__(self):
-        # Enforce the "MUST" rule here
-        if self.name is None:
-            # We allow None during initial load, but it must be set before usage
-            # or handled by the loader.
-            pass
-T = TypeVar("T", bound=AutoNamedCfg)
+from typing import Tuple, Any, Optional
+from .base_config import ExpBaseCfg
+from ..perf.perfcalc import PerfCalc
+from ..perf.perfmetrics import MetricsBackend
-class BaseSelectorCfg(Generic[T]):
-    """
-    Base class to handle the logic of selecting an item from a list by name.
-    """
-    def _resolve_selection(self, items: List[T], selected_name: str, context: str) -> T:
-        if selected_name is None:
-            raise ValueError(f"No {context} selected in the configuration.")
-        # Create a lookup dict for O(1) access, or just iterate if list is short
-        for item in items:
-            if item.name == selected_name:
-                return item
+class ExpHook:
+    """Base interface for all experiment hooks."""
+    def on_before_run(self, exp): pass
+    def on_after_run(self, exp, results): pass
-        raise ValueError(
-            f"{context.capitalize()} '{selected_name}' not found in the configuration list."
-        )
-class ExpBaseCfg(ABC, YAMLWizard):
+# ! SEE https://github.com/hahv/base_exp for sample usage
+class BaseExp(PerfCalc, ABC):
     """
-    Base class for configuration objects.
-    What a cfg class must have:
-    1 - a dataset cfg
-    2 - a metric cfg
-    3 - a method cfg
+    Base class for experiments.
+    Orchestrates the experiment pipeline using a pluggable metrics backend.
     """
-    cfg_name: Optional[str] = None
-    # Save to yaml fil
-    def save_to_outdir(
-        self, filename: str = "__config.yaml", outdir=None, override: bool = False
-    ) -> None:
-        """
-        Save the configuration to the output directory.
-        """
-        if outdir is not None:
-            output_dir = outdir
-        else:
-            output_dir = self.get_outdir()
-        os.makedirs(output_dir, exist_ok=True)
-        assert (output_dir is not None) and (
-            os.path.isdir(output_dir)
-        ), f"Output directory '{output_dir}' does not exist or is not a directory."
-        file_path = os.path.join(output_dir, filename)
-        if os.path.exists(file_path) and not override:
-            pprint(
-                f"File '{file_path}' already exists. Use 'override=True' to overwrite."
-            )
-        else:
-            # method of YAMLWizard to_yaml_file
-            self.to_yaml_file(file_path)
-    @classmethod
+    def __init__(self, config: ExpBaseCfg):
+        self.config = config
+        self.metric_backend = None
+        # Flag to track if init_general/prepare_dataset has run
+        self._is_env_ready = False
+        self.hooks = []
+    def register_hook(self, hook: ExpHook):
+        self.hooks.append(hook)
+    def _trigger_hooks(self, method_name: str, *args, **kwargs):
+        for hook in self.hooks:
+            method = getattr(hook, method_name, None)
+            if callable(method):
+                method(*args, **kwargs)
+    # -----------------------
+    # PerfCalc Required Methods
+    # -----------------------
+    def get_dataset_name(self):
+        return self.config.get_dataset_cfg().get_name()
+    def get_experiment_name(self):
+        return self.config.get_cfg_name()
+    def get_metric_backend(self):
+        if not self.metric_backend:
+            self.metric_backend = self.prepare_metrics(self.config.get_metric_cfg())
+        return self.metric_backend
+    # -----------------------
+    # Abstract Experiment Steps
+    # -----------------------
     @abstractmethod
-    # load from a custom YAML file
-    def from_custom_yaml_file(cls, yaml_file: str):
-        """Load a configuration from a custom YAML file."""
+    def init_general(self, general_cfg):
+        """Setup general settings like SEED, logging, env variables."""
         pass
-    def get_cfg_name(self, sep: str = "__", *args, **kwargs) -> str:
-        if self.cfg_name is None:
-            # auto get the config name from dataset, method, metric
-            # 2. Generate the canonical Config Name
-            name_parts = []
-            general_info = self.get_general_cfg().get_name()
-            dataset_info = self.get_dataset_cfg().get_name()
-            method_info = self.get_method_cfg().get_name()
-            name_parts = [
-                general_info,
-                f"ds_{dataset_info}",
-                f"mt_{method_info}",
-            ]
-            if "extra" in kwargs:
-                extra_info = kwargs["extra"]
-                assert isinstance(extra_info, str), "'extra' kwarg must be a string."
-                name_parts.append(extra_info)
-            self.cfg_name = sep.join(name_parts)
-        return self.cfg_name
     @abstractmethod
-    def get_outdir(self):
-        """
-        Get the output directory for the configuration.
-        This method should be implemented in subclasses.
-        """
-        return None
+    def prepare_dataset(self, dataset_cfg):
+        """Load/prepare dataset."""
+        pass
     @abstractmethod
-    def get_general_cfg(self) -> NamedCfg:
+    def prepare_metrics(self, metric_cfg) -> MetricsBackend:
         """
-        Get the general configuration like output directory, log settings, SEED, etc.
+        Prepare the metrics for the experiment.
         This method should be implemented in subclasses.
         """
         pass
     @abstractmethod
-    def get_dataset_cfg(self) -> NamedCfg:
-        """
-        Get the dataset configuration.
-        This method should be implemented in subclasses.
+    def exec_exp(self, *args, **kwargs) -> Optional[Tuple[Any, Any]]:
+        """Run experiment process, e.g.: training/evaluation loop.
+        Return: either `None` or a tuple of (raw_metrics_data, extra_data) for calc_and_save_exp_perfs
         """
         pass
-    @abstractmethod
-    def get_method_cfg(self) -> NamedCfg:
+    # -----------------------
+    # Internal Helpers
+    # -----------------------
+    def _validate_and_unpack(self, results):
+        if results is None:
+            return None
+        if not isinstance(results, (tuple, list)) or len(results) != 2:
+            raise ValueError("exec must return (metrics_data, extra_data)")
+        return results[0], results[1]
+    def _prepare_environment(self, force_reload: bool = False):
         """
-        Get the method configuration.
-        This method should be implemented in subclasses.
+        Common setup. Skips if already initialized, unless force_reload is True.
         """
-        pass
+        if self._is_env_ready and not force_reload:
+            # Environment is already prepared, skipping setup.
+            return
-    @abstractmethod
-    def get_metric_cfg(self) -> NamedCfg:
+        # 1. Run Setup
+        self.init_general(self.config.get_general_cfg())
+        self.prepare_dataset(self.config.get_dataset_cfg())
+        # 2. Update metric backend (refresh if needed)
+        self.metric_backend = self.prepare_metrics(self.config.get_metric_cfg())
+        # 3. Mark as ready
+        self._is_env_ready = True
+    # -----------------------
+    # Main Experiment Runner
+    # -----------------------
+    def run_exp(self, should_calc_metrics=True, reload_env=False, *args, **kwargs):
         """
-        Get the metric configuration.
-        This method should be implemented in subclasses.
+        Run the whole experiment pipeline.
+        :param reload_env: If True, forces dataset/general init to run again.
+        :param should_calc_metrics: Whether to calculate and save metrics after execution.
+        :kwargs Params:
+            + 'outfile' to save csv file results,
+            + 'outdir' to set output directory for experiment results.
+            + 'return_df' to return a DataFrame of results instead of a dictionary.
+        Full pipeline:
+            1. Init
+            2. Prepare Environment (General + Dataset + Metrics)
+            3. Save Config
+            4. Execute
+            5. Calculate & Save Metrics
         """
-        pass
+        self._prepare_environment(force_reload=reload_env)
+        self._trigger_hooks("before_run", self)
+        # Save config before running
+        self.config.save_to_outdir()
+        # Execute experiment
+        results = self.exec_exp(*args, **kwargs)
+        if should_calc_metrics and results is not None:
+            metrics_data, extra_data = self._validate_and_unpack(results)
+            # Calculate & Save metrics
+            perf_results = self.calc_perfs(
+                raw_metrics_data=metrics_data, extra_data=extra_data, *args, **kwargs
+            )
+            self._trigger_hooks("after_run", self, perf_results)
+            return perf_results
+        else:
+            self._trigger_hooks("after_run", self, results)
+            return results

halib/system/_list_pc.csv ADDED Viewed

@@ -0,0 +1,6 @@
+pc_name;abbr;working_disk
+DESKTOP-JQD9K01;MainPC;E:
+DESKTOP-5IRHU87;MSI_Laptop;D:
+DESKTOP-96HQCNO;4090_SV;E:
+DESKTOP-Q2IKLC0;4GPU_SV;D:
+DESKTOP-QNS3DNF;1GPU_SV;D:

halib/system/path.py CHANGED Viewed

@@ -3,28 +3,39 @@ from ..filetype import csvfile
 import pandas as pd
 import platform
 import re  # <--- [FIX 1] Added missing import
-PC_TO_ABBR = {
-    "DESKTOP-JQD9K01": "MainPC",
-    "DESKTOP-5IRHU87": "MSI_Laptop",
-    "DESKTOP-96HQCNO": "4090_SV",
-    "DESKTOP-Q2IKLC0": "4GPU_SV",
-    "DESKTOP-QNS3DNF": "1GPU_SV",
-}
-ABBR_DISK_MAP = {
-    "MainPC": "E:",
-    "MSI_Laptop": "D:",
-    "4090_SV": "E:",
-    "4GPU_SV": "D:",
-}
+import csv
+from importlib import resources
+PC_TO_ABBR = {}
+ABBR_DISK_MAP = {}
+pc_df = None
+cPlatform = platform.system().lower()
+def load_pc_meta_info():
+    # 1. Define the package where the file lives (dotted notation)
+    #    Since the file is in 'halib/system/', the package is 'halib.system'
+    package_name = "halib.system"
+    file_name = "_list_pc.csv"
+    # 2. Locate the file
+    csv_path = resources.files(package_name).joinpath(file_name)
+    global PC_TO_ABBR, ABBR_DISK_MAP, pc_df
+    pc_df = pd.read_csv(csv_path, sep=';', encoding='utf-8')
+    PC_TO_ABBR = dict(zip(pc_df['pc_name'], pc_df['abbr']))
+    ABBR_DISK_MAP = dict(zip(pc_df['abbr'], pc_df['working_disk']))
+    pprint("Loaded PC meta info:")
+    pprint(ABBR_DISK_MAP)
+    pprint(PC_TO_ABBR)
+# ! must be called at the module load time
+load_pc_meta_info()
 def list_PCs(show=True):
-    df = pd.DataFrame(list(PC_TO_ABBR.items()), columns=["PC Name", "Abbreviation"])
+    global pc_df
     if show:
-        csvfile.fn_display_df(df)
-    return df
+        csvfile.fn_display_df(pc_df)
+    return pc_df
 def get_PC_name():
@@ -44,11 +55,12 @@ def get_working_disk(abbr_disk_map=ABBR_DISK_MAP):
     pc_abbr = get_PC_abbr_name()
     return abbr_disk_map.get(pc_abbr, None)
+cDisk = get_working_disk()
# ! This function searches for full paths in the obj and normalizes them according to the current platform and working disk
 # ! E.g: "E:/zdataset/DFire", but working_disk: "D:", current_platform: "windows" => "D:/zdataset/DFire"
 # ! E.g: "E:/zdataset/DFire", but working_disk: "D:", current_platform: "linux" => "/mnt/d/zdataset/DFire"
-def normalize_paths(obj, working_disk=None, current_platform=None):
+def normalize_paths(obj, working_disk=cDisk, current_platform=cPlatform):
     # [FIX 3] Resolve defaults inside function to be safer/cleaner
     if working_disk is None:
         working_disk = get_working_disk()

{halib-0.2.8.dist-info → halib-0.2.10.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: halib
-Version: 0.2.8
+Version: 0.2.10
 Summary: Small library for common tasks
 Author: Hoang Van Ha
 Author-email: hoangvanhauit@gmail.com
@@ -53,7 +53,7 @@ Dynamic: summary
 # Helper package for coding and automation
-**Version 0.2.8**
+**Version 0.2.10**
 + reorganize packages with most changes in `research` package; also rename `research` to `exp` (package for experiment management and utilities)
 + update `exp/perfcalc.py` to allow saving computed performance to a CSV file (without explicitly calling the `calc_perfs` method)

{halib-0.2.8.dist-info → halib-0.2.10.dist-info}/RECORD RENAMED Viewed

@@ -22,7 +22,7 @@ halib/common/rich_color.py,sha256=tyK5fl3Dtv1tKsfFzt_5Rco4Fj72QliA-w5aGXaVuqQ,63
 halib/exp/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 halib/exp/core/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 halib/exp/core/base_config.py,sha256=Js2oVDt7qwT7eV_sOUWw6XXl569G1bX6ls-VYAx2gWY,5032
-halib/exp/core/base_exp.py,sha256=XjRHXbUHE-DCZLRDTteDF5gsxKN3mhGEe2zWL24JP80,5131
+halib/exp/core/base_exp.py,sha256=fknJVmW6ubbapOggbkrbNWgc1ZXcUz_FE3wMyuIGX7M,5180
 halib/exp/core/param_gen.py,sha256=I9JHrDCaep4CjvApDoX0QzFuw38zMC2PsDFueuA7pjM,4271
 halib/exp/core/wandb_op.py,sha256=powL2QyLBqF-6PUGAOqd60s1npHLLKJxPns3S4hKeNo,4160
 halib/exp/data/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
@@ -89,9 +89,10 @@ halib/sys/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 halib/sys/cmd.py,sha256=b2x7JPcNnFjLGheIESVYvqAb-w2UwBM1PAwYxMZ5YjA,228
 halib/sys/filesys.py,sha256=ERpnELLDKJoTIIKf-AajgkY62nID4qmqmX5TkE95APU,2931
 halib/system/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+halib/system/_list_pc.csv,sha256=IIQnC32RZ-j5uRS_C1HD0nvTlpxv-ItphZNmEns65iU,172
 halib/system/cmd.py,sha256=b2x7JPcNnFjLGheIESVYvqAb-w2UwBM1PAwYxMZ5YjA,228
 halib/system/filesys.py,sha256=102J2fkQhmH1_-HQVy2FQ4NOU8LTjMWV3hToT_APtq8,4401
-halib/system/path.py,sha256=uCXTltd943L_2heU2HLwvXcgYJRd8-ZEzDe435419OQ,3165
+halib/system/path.py,sha256=CvWMiGKtrqSq816W6rkiy6QRq3FGb4GWlnNkPZjIvnc,3688
 halib/utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 halib/utils/dataclass_util.py,sha256=rj2IMLlUzbm2OlF5_B2dRTk9njZOaF7tTjYkOsq8uLY,1416
 halib/utils/dict.py,sha256=wYE6Iw-_CnCWdMg9tpJ2Y2-e2ESkW9FxmdBkZkbUh80,299
@@ -101,8 +102,8 @@ halib/utils/list.py,sha256=BM-8sRhYyqF7bh4p7TQtV7P_gnFruUCA6DTUOombaZg,337
 halib/utils/listop.py,sha256=Vpa8_2fI0wySpB2-8sfTBkyi_A4FhoFVVvFiuvW8N64,339
 halib/utils/tele_noti.py,sha256=-4WXZelCA4W9BroapkRyIdUu9cUVrcJJhegnMs_WpGU,5928
 halib/utils/video.py,sha256=zLoj5EHk4SmP9OnoHjO8mLbzPdtq6gQPzTQisOEDdO8,3261
-halib-0.2.8.dist-info/licenses/LICENSE.txt,sha256=qZssdna4aETiR8znYsShUjidu-U4jUT9Q-EWNlZ9yBQ,1100
-halib-0.2.8.dist-info/METADATA,sha256=QU-YIW5BNbgDy9j9ttQsleQ2zkBmWjpVazjjb23vIo8,6836
-halib-0.2.8.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
-halib-0.2.8.dist-info/top_level.txt,sha256=7AD6PLaQTreE0Fn44mdZsoHBe_Zdd7GUmjsWPyQ7I-k,6
-halib-0.2.8.dist-info/RECORD,,
+halib-0.2.10.dist-info/licenses/LICENSE.txt,sha256=qZssdna4aETiR8znYsShUjidu-U4jUT9Q-EWNlZ9yBQ,1100
+halib-0.2.10.dist-info/METADATA,sha256=EEhbKj7cVxfoVEyOWZRkJZTSFg4esZFIVqwa0-Idnh0,6838
+halib-0.2.10.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
+halib-0.2.10.dist-info/top_level.txt,sha256=7AD6PLaQTreE0Fn44mdZsoHBe_Zdd7GUmjsWPyQ7I-k,6
+halib-0.2.10.dist-info/RECORD,,

{halib-0.2.8.dist-info → halib-0.2.10.dist-info}/WHEEL RENAMED Viewed

File without changes

{halib-0.2.8.dist-info → halib-0.2.10.dist-info}/licenses/LICENSE.txt RENAMED Viewed

File without changes

{halib-0.2.8.dist-info → halib-0.2.10.dist-info}/top_level.txt RENAMED Viewed

File without changes

halib 0.2.8__py3-none-any.whl → 0.2.10__py3-none-any.whl

halib 0.2.8__py3-none-any.whl → 0.2.10__py3-none-any.whl