PyPI - omnigenome - Versions diffs - 0.3.0a0__py3-none-any.whl → 0.3.1a0__py3-none-any.whl - Mend

omnigenome 0.3.0a0__py3-none-any.whl → 0.3.1a0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (73)

omnigenome/__init__.py +29 -44
omnigenome/auto/auto_bench/__init__.py +0 -1
omnigenome/auto/auto_bench/auto_bench.py +24 -14
omnigenome/auto/auto_train/__init__.py +0 -1
omnigenome/auto/auto_train/auto_train.py +11 -12
omnigenome/auto/bench_hub/__init__.py +0 -1
omnigenome/auto/bench_hub/bench_hub.py +1 -1
omnigenome/cli/__init__.py +0 -1
omnigenome/cli/commands/__init__.py +0 -1
omnigenome/cli/commands/base.py +10 -10
omnigenome/cli/commands/bench/__init__.py +0 -1
omnigenome/cli/commands/bench/bench_cli.py +10 -10
omnigenome/cli/commands/rna/__init__.py +0 -1
omnigenome/cli/commands/rna/rna_design.py +10 -11
omnigenome/src/__init__.py +0 -1
omnigenome/src/abc/__init__.py +0 -1
omnigenome/src/abc/abstract_dataset.py +38 -19
omnigenome/src/abc/abstract_metric.py +7 -7
omnigenome/src/abc/abstract_model.py +15 -14
omnigenome/src/abc/abstract_tokenizer.py +9 -7
omnigenome/src/dataset/omni_dataset.py +16 -14
omnigenome/src/lora/__init__.py +0 -1
omnigenome/src/lora/lora_model.py +47 -41
omnigenome/src/metric/classification_metric.py +11 -11
omnigenome/src/metric/metric.py +19 -19
omnigenome/src/metric/ranking_metric.py +15 -15
omnigenome/src/metric/regression_metric.py +18 -18
omnigenome/src/misc/utils.py +214 -150
omnigenome/src/model/augmentation/__init__.py +0 -1
omnigenome/src/model/augmentation/model.py +17 -17
omnigenome/src/model/classification/__init__.py +0 -1
omnigenome/src/model/classification/model.py +28 -32
omnigenome/src/model/embedding/__init__.py +0 -1
omnigenome/src/model/embedding/model.py +35 -35
omnigenome/src/model/mlm/__init__.py +0 -1
omnigenome/src/model/mlm/model.py +13 -13
omnigenome/src/model/module_utils.py +17 -17
omnigenome/src/model/regression/__init__.py +0 -1
omnigenome/src/model/regression/model.py +72 -77
omnigenome/src/model/regression/resnet.py +32 -32
omnigenome/src/model/rna_design/__init__.py +0 -1
omnigenome/src/model/rna_design/model.py +168 -118
omnigenome/src/model/seq2seq/__init__.py +0 -1
omnigenome/src/model/seq2seq/model.py +4 -4
omnigenome/src/tokenizer/bpe_tokenizer.py +27 -27
omnigenome/src/tokenizer/kmers_tokenizer.py +22 -22
omnigenome/src/tokenizer/single_nucleotide_tokenizer.py +11 -11
omnigenome/src/trainer/accelerate_trainer.py +40 -32
omnigenome/src/trainer/hf_trainer.py +8 -8
omnigenome/src/trainer/trainer.py +37 -25
omnigenome/utility/dataset_hub/__init__.py +0 -1
omnigenome/utility/dataset_hub/dataset_hub.py +13 -13
omnigenome/utility/ensemble.py +26 -26
omnigenome/utility/hub_utils.py +8 -8
omnigenome/utility/model_hub/__init__.py +0 -1
omnigenome/utility/model_hub/model_hub.py +26 -25
omnigenome/utility/pipeline_hub/__init__.py +0 -1
omnigenome/utility/pipeline_hub/pipeline.py +49 -49
omnigenome/utility/pipeline_hub/pipeline_hub.py +17 -17
{omnigenome-0.3.0a0.dist-info → omnigenome-0.3.1a0.dist-info}/METADATA +3 -3
omnigenome-0.3.1a0.dist-info/RECORD +78 -0
{omnigenome-0.3.0a0.dist-info → omnigenome-0.3.1a0.dist-info}/top_level.txt +0 -1
omnigenome-0.3.0a0.dist-info/RECORD +0 -85
tests/__init__.py +0 -9
tests/conftest.py +0 -160
tests/test_dataset_patterns.py +0 -291
tests/test_examples_syntax.py +0 -83
tests/test_model_loading.py +0 -183
tests/test_rna_functions.py +0 -255
tests/test_training_patterns.py +0 -302
{omnigenome-0.3.0a0.dist-info → omnigenome-0.3.1a0.dist-info}/WHEEL +0 -0
{omnigenome-0.3.0a0.dist-info → omnigenome-0.3.1a0.dist-info}/entry_points.txt +0 -0
{omnigenome-0.3.0a0.dist-info → omnigenome-0.3.1a0.dist-info}/licenses/LICENSE +0 -0

omnigenome/src/metric/regression_metric.py CHANGED Viewed

@@ -20,20 +20,20 @@ from ..abc.abstract_metric import OmniMetric
 def mcrmse(y_true, y_pred):
     """
     Compute Mean Column Root Mean Square Error (MCRMSE).
     MCRMSE is a multi-target regression metric that computes the RMSE for each target
     column and then takes the mean across all targets.
     Args:
         y_true (np.ndarray): Ground truth values with shape (n_samples, n_targets)
         y_pred (np.ndarray): Predicted values with shape (n_samples, n_targets)
     Returns:
         float: Mean Column Root Mean Square Error
     Raises:
         ValueError: If y_true and y_pred have different shapes
     Example:
         >>> y_true = np.array([[1, 2], [3, 4], [5, 6]])
         >>> y_pred = np.array([[1.1, 2.1], [2.9, 4.1], [5.2, 5.8]])
@@ -56,18 +56,18 @@ setattr(metrics, "mcrmse", mcrmse)
 class RegressionMetric(OmniMetric):
     """
     A specialized metric class for regression tasks and evaluation.
     This class provides access to regression-specific metrics from scikit-learn
     and handles different input formats including HuggingFace trainer outputs.
     It dynamically wraps scikit-learn metrics and provides a unified interface
     for computing various regression evaluation metrics.
     Attributes:
         metric_func: Custom metric function if provided
         ignore_y: Value to ignore in predictions and true values
         kwargs: Additional keyword arguments for metric computation
         metrics: Dictionary of available metrics including custom ones
     Example:
         >>> from omnigenome.src.metric import RegressionMetric
         >>> metric = RegressionMetric(ignore_y=-100)
@@ -81,7 +81,7 @@ class RegressionMetric(OmniMetric):
     def __init__(self, metric_func=None, ignore_y=-100, *args, **kwargs):
         """
         Initialize the RegressionMetric class.
         Args:
             metric_func (callable, optional): Custom metric function to use
             ignore_y (int, optional): Value to ignore in predictions and true values. Defaults to -100
@@ -97,14 +97,14 @@ class RegressionMetric(OmniMetric):
     def __getattribute__(self, name):
         """
         Dynamically create regression metric computation methods.
         This method intercepts attribute access and creates wrapper functions
         for scikit-learn regression metrics, handling different input formats and
         preprocessing the data appropriately.
         Args:
             name (str): Name of the regression metric to access
         Returns:
             callable: Wrapper function for the requested regression metric
         """
@@ -118,17 +118,17 @@ class RegressionMetric(OmniMetric):
             def wrapper(y_true=None, y_score=None, *args, **kwargs):
                 """
                 Compute the regression metric, based on the true and predicted values.
                 This wrapper handles different input formats including HuggingFace
                 trainer outputs and performs necessary preprocessing for regression tasks.
                 Args:
                     y_true: The true values or HuggingFace EvalPrediction object
                     y_score: The predicted values
                     ignore_y: The value to ignore in the predictions and true values in corresponding positions
                     *args: Additional positional arguments for the metric
                     **kwargs: Additional keyword arguments for the metric
                 Returns:
                     dict: Dictionary containing the metric name and computed value
                 """
@@ -168,16 +168,16 @@ class RegressionMetric(OmniMetric):
     def compute(self, y_true, y_score, *args, **kwargs):
         """
         Compute the regression metric, based on the true and predicted values.
         Args:
             y_true: The true values
             y_score: The predicted values
             *args: Additional positional arguments for the metric
             **kwargs: Additional keyword arguments for the metric
         Returns:
             The computed regression metric value
         Raises:
             NotImplementedError: If no metric function is provided and compute is not implemented
         """

omnigenome/src/misc/utils.py CHANGED Viewed

@@ -12,6 +12,7 @@ import pickle
 import sys
 import tempfile
 import time
+import warnings
 import ViennaRNA as RNA
 import findfile
@@ -24,13 +25,13 @@ default_omnigenome_repo = (
 def seed_everything(seed=42):
     """
     Sets random seeds for reproducibility across all random number generators.
     This function sets seeds for Python's random module, NumPy, PyTorch (CPU and CUDA),
     and sets the PYTHONHASHSEED environment variable to ensure reproducible results
     across different runs.
     Args:
-        seed (int): The seed value to use for all random number generators.
+        seed (int): The seed value to use for all random number generators.
                    Defaults to 42.
     Example:
@@ -48,58 +49,50 @@ def seed_everything(seed=42):
     torch.manual_seed(seed)
     torch.cuda.manual_seed(seed)
     torch.backends.cudnn.deterministic = True
+    torch.backends.cudnn.benchmark = False
 class RNA2StructureCache(dict):
     """
-    A cache for RNA sequence to structure predictions using ViennaRNA.
-    This class provides a dictionary-like interface for caching RNA secondary
-    structure predictions. It uses ViennaRNA for structure prediction and
-    supports both single sequences and batches of sequences.
-    The cache can be persisted to disk and loaded back, making it useful for
-    avoiding redundant structure predictions across multiple runs.
+    A cache for RNA secondary structure predictions using ViennaRNA.
+    This class provides a caching mechanism for RNA secondary structure predictions
+    to avoid redundant computations. It supports both single sequence and batch
+    processing with optional multiprocessing for improved performance.
     Attributes:
-        cache_file (str): Path to the cache file on disk.
-        cache (dict): The in-memory cache dictionary.
-        queue_num (int): Counter for tracking cache updates.
+        cache (dict): Dictionary storing sequence-structure mappings
+        cache_file (str): Path to the cache file on disk
+        queue_num (int): Counter for tracking cache updates
     """
     def __init__(self, cache_file=None, *args, **kwargs):
         """
-        Initializes the RNA structure cache.
+        Initialize the RNA structure cache.
         Args:
             cache_file (str, optional): Path to the cache file. If None, uses
-                                      a default path in `__OMNIGENOME_DATA__`.
-            *args: Additional arguments passed to dict constructor.
-            **kwargs: Additional keyword arguments passed to dict constructor.
-        Example:
-            >>> # Initialize with default cache file
-            >>> cache = RNA2StructureCache()
-            >>> # Initialize with custom cache file
-            >>> cache = RNA2StructureCache("my_cache.pkl")
+                                      a default temporary file.
+            *args: Additional positional arguments for dict initialization
+            **kwargs: Additional keyword arguments for dict initialization
         """
         super().__init__(*args, **kwargs)
-        if not cache_file:
-            self.cache_file = "__OMNIGENOME_DATA__/rna2structure.cache.pkl"
-        else:
-            self.cache_file = cache_file
-        if self.cache_file is None or not os.path.exists(self.cache_file):
-            self.cache = {}
-        else:
-            fprint(f"Initialize sequence to structure cache from {self.cache_file}...")
-            with open(self.cache_file, "rb") as f:
-                self.cache = pickle.load(f)
+        self.cache = dict(*args, **kwargs)
+        self.cache_file = (
+            cache_file
+            if cache_file is not None
+            else os.path.join(tempfile.gettempdir(), "rna_structure_cache.pkl")
+        )
         self.queue_num = 0
+        # Load existing cache if available
+        if os.path.exists(self.cache_file):
+            try:
+                with open(self.cache_file, "rb") as f:
+                    self.cache.update(pickle.load(f))
+            except Exception as e:
+                warnings.warn(f"Failed to load cache file: {e}")
     def __getitem__(self, key):
         """Gets a cached structure prediction."""
         return self.cache[key]
@@ -116,15 +109,31 @@ class RNA2StructureCache(dict):
         """String representation of the cache."""
         return str(self.cache)
+    def _fold_single_sequence(self, sequence):
+        """
+        Predict structure for a single sequence (worker function for multiprocessing).
+        Args:
+            sequence (str): RNA sequence to fold
+        Returns:
+            tuple: (structure, mfe) tuple
+        """
+        try:
+            return RNA.fold(sequence)
+        except Exception as e:
+            warnings.warn(f"Failed to fold sequence {sequence}: {e}")
+            return ("." * len(sequence), 0.0)
     def fold(self, sequence, return_mfe=False, num_workers=1):
         """
         Predicts RNA secondary structure for given sequences.
         This method predicts RNA secondary structures using ViennaRNA. It supports
         both single sequences and batches of sequences. The method uses caching
         to avoid redundant predictions and supports multiprocessing for batch
         processing on non-Windows systems.
         Args:
             sequence (str or list): A single RNA sequence or a list of sequences.
             return_mfe (bool): Whether to return minimum free energy along with
@@ -141,7 +150,7 @@ class RNA2StructureCache(dict):
             >>> # Predict structure for a single sequence
             >>> structure = cache.fold("GGGAAAUCC")
             >>> print(structure)  # "(((...)))"
             >>> # Predict structures for multiple sequences
             >>> structures = cache.fold(["GGGAAAUCC", "AUUGCUAA"])
             >>> print(structures)  # ["(((...)))", "........"]
@@ -151,39 +160,62 @@ class RNA2StructureCache(dict):
         else:
             sequences = sequence
-        if (
-            os.name != "nt" and len(sequences) > 1
-        ):  # multiprocessing is not working on Windows in my case
-            num_workers = min(os.cpu_count(), len(sequences))
+        # Determine if we should use multiprocessing
+        use_multiprocessing = (
+            os.name != "nt"  # Not Windows
+            and len(sequences) > 1  # Multiple sequences
+            and num_workers > 1  # Multiple workers requested
+        )
-        structures = []
+        # Find sequences that need prediction
+        sequences_to_predict = [seq for seq in sequences if seq not in self.cache]
-        if not all([seq in self.cache for seq in sequences]):
-            if num_workers == 1:
-                for seq in sequences:
-                    if seq not in self.cache:
-                        self.queue_num += 1
-                        self.cache[seq] = RNA.fold(seq)
-            else:
+        if sequences_to_predict:
+            if use_multiprocessing:
+                # Use multiprocessing for batch prediction
                 if num_workers is None:
-                    num_workers = min(os.cpu_count(), len(sequences))
-                with multiprocessing.Pool(num_workers) as pool:
-                    for seq in sequences:
-                        if seq not in self.cache:
+                    num_workers = min(os.cpu_count(), len(sequences_to_predict))
+                try:
+                    # Set multiprocessing start method to 'spawn' for better compatibility
+                    if multiprocessing.get_start_method(allow_none=True) != "spawn":
+                        multiprocessing.set_start_method("spawn", force=True)
+                    with multiprocessing.Pool(num_workers) as pool:
+                        # Use map instead of apply_async for better error handling
+                        results = pool.map(
+                            self._fold_single_sequence, sequences_to_predict
+                        )
+                        # Update cache with results
+                        for seq, result in zip(sequences_to_predict, results):
+                            self.cache[seq] = result
                             self.queue_num += 1
-                            async_result = pool.apply_async(RNA.fold, args=(seq,))
-                            structures.append((seq, async_result))
-                    for seq, result in structures:
-                        self.cache[seq] = result.get()  # result is a tuple
+                except Exception as e:
+                    warnings.warn(
+                        f"Multiprocessing failed, falling back to sequential: {e}"
+                    )
+                    # Fallback to sequential processing
+                    for seq in sequences_to_predict:
+                        self.cache[seq] = self._fold_single_sequence(seq)
+                        self.queue_num += 1
+            else:
+                # Sequential processing
+                for seq in sequences_to_predict:
+                    self.cache[seq] = self._fold_single_sequence(seq)
+                    self.queue_num += 1
+        # Prepare output
         if return_mfe:
             structures = [self.cache[seq] for seq in sequences]
         else:
             structures = [self.cache[seq][0] for seq in sequences]
+        # Update cache file periodically
         self.update_cache_file(self.cache_file)
+        # Return single result or list
         if len(structures) == 1:
             return structures[0]
         else:
@@ -192,10 +224,10 @@ class RNA2StructureCache(dict):
     def update_cache_file(self, cache_file=None):
         """
         Updates the cache file on disk.
         This method saves the in-memory cache to disk. It only saves when
         the queue_num reaches 100 to avoid excessive disk I/O.
         Args:
             cache_file (str, optional): Path to the cache file. If None, uses
                                       the instance's cache_file.
@@ -209,24 +241,26 @@ class RNA2StructureCache(dict):
         if cache_file is None:
             cache_file = self.cache_file
-        if not os.path.exists(os.path.dirname(cache_file)):
-            os.makedirs(os.path.dirname(cache_file))
+        try:
+            if not os.path.exists(os.path.dirname(cache_file)):
+                os.makedirs(os.path.dirname(cache_file))
-        # print(f"Updating cache file {cache_file}...")
-        with open(cache_file, "wb") as f:
-            pickle.dump(self.cache, f)
+            with open(cache_file, "wb") as f:
+                pickle.dump(self.cache, f)
-        self.queue_num = 0
+            self.queue_num = 0
+        except Exception as e:
+            warnings.warn(f"Failed to update cache file: {e}")
 def env_meta_info():
     """
     Collects metadata about the current environment and library versions.
     This function gathers information about the current Python environment,
     including versions of key libraries like PyTorch and Transformers,
     as well as OmniGenome version information.
     Returns:
         dict: A dictionary containing environment metadata including:
               - library_name: Name of the OmniGenome library
@@ -256,7 +290,7 @@ def env_meta_info():
 def naive_secondary_structure_repair(sequence, structure):
     """
     Repair the secondary structure of a sequence.
     This function attempts to repair malformed RNA secondary structure
     representations by ensuring proper bracket matching. It handles
     common issues like unmatched brackets by converting them to dots.
@@ -294,7 +328,7 @@ def naive_secondary_structure_repair(sequence, structure):
 def save_args(config, save_path):
     """
     Save arguments to a file.
     This function saves the arguments from a configuration object to a text file.
     It's useful for logging experiment parameters and configurations.
@@ -317,7 +351,7 @@ def save_args(config, save_path):
 def print_args(config, logger=None):
     """
     Print the arguments to the console.
     This function prints the arguments from a configuration object to the console
     or a logger. It's useful for debugging and logging experiment parameters.
@@ -330,110 +364,140 @@ def print_args(config, logger=None):
         >>> config = Namespace(learning_rate=0.001, batch_size=32)
         >>> print_args(config)
     """
-    args = [key for key in sorted(config.args.keys())]
-    if logger:
-        logger.info(args)
+    if logger is None:
+        for arg in config.args:
+            if config.args_call_count[arg]:
+                print("{}: {}".format(arg, config.args[arg]))
     else:
-        fprint(args)
+        for arg in config.args:
+            if config.args_call_count[arg]:
+                logger.info("{}: {}".format(arg, config.args[arg]))
 def fprint(*objects, sep=" ", end="\n", file=sys.stdout, flush=False):
     """
-    Custom print function that adds a timestamp and the pyabsa version before the printed message.
+    Enhanced print function with automatic flushing.
+    This function provides a print-like interface with automatic flushing
+    to ensure output is displayed immediately. It's useful for real-time
+    logging and progress tracking.
     Args:
-        *objects: Any number of objects to be printed
-        sep (str, optional): Separator between objects. Defaults to " ".
-        end (str, optional): Ending character after all objects are printed. Defaults to "\n".
-        file (io.TextIOWrapper, optional): Text file to write printed output to. Defaults to sys.stdout.
-        flush (bool, optional): Whether to flush output buffer after printing. Defaults to False.
+        *objects: Objects to print
+        sep (str): Separator between objects (default: " ")
+        end (str): String appended after the last value (default: "\n")
+        file: File-like object to write to (default: sys.stdout)
+        flush (bool): Whether to flush the stream (default: False)
+    Example:
+        >>> fprint("Training started...", flush=True)
+        >>> fprint("Epoch 1/10", "Loss: 0.5", sep=" | ")
     """
-    from omnigenome import __version__
-    from omnigenome import __name__
-    print(
-        time.strftime(
-            "[%Y-%m-%d %H:%M:%S] [{} {}] ".format(__name__, __version__),
-            time.localtime(time.time()),
-        ),
-        *objects,
-        sep=sep,
-        end=end,
-        file=file,
-        flush=flush,
-    )
+    print(*objects, sep=sep, end=end, file=file, flush=True)
 def clean_temp_checkpoint(days_threshold=7):
     """
-    删除超过指定时间的 checkpoint 文件。
+    Clean up temporary checkpoint files older than specified days.
+    This function removes temporary checkpoint files that are older than
+    the specified threshold to free up disk space.
+    Args:
+        days_threshold (int): Number of days after which files are considered old.
+                            Defaults to 7.
-    参数：
-    - directory (str): 文件所在的目录路径。
-    - file_extension (str): checkpoint 文件的扩展名，默认是 ".ckpt"。
-    - days_threshold (int): 超过多少天的文件将被删除，默认是 7 天。
+    Example:
+        >>> clean_temp_checkpoint(3)  # Remove files older than 3 days
     """
-    # 获取当前时间
-    import os
-    from datetime import datetime, timedelta
-    current_time = datetime.now()
-    ckpt_files = findfile.find_cwd_files(["tmp_ckpt", ".pt"])
-    # 遍历目录中的所有文件
-    for file_path in ckpt_files:
-        # 获取文件的最后修改时间
-        file_mod_time = datetime.fromtimestamp(os.path.getmtime(file_path))
-        # 计算文件是否超过指定的时间阈值
-        if current_time - file_mod_time > timedelta(days=days_threshold):
+    import glob
+    import time
+    temp_patterns = [
+        "temp_checkpoint_*",
+        "checkpoint_*",
+        "*.tmp",
+        "*.temp",
+    ]
+    current_time = time.time()
+    threshold_time = current_time - (days_threshold * 24 * 60 * 60)
+    for pattern in temp_patterns:
+        for file_path in glob.glob(pattern):
             try:
-                # 删除文件
-                os.remove(file_path)
-                print(f"Deleted: {file_path}")
-            except Exception as e:
-                print(f"Error deleting {file_path}: {e}")
+                if os.path.getmtime(file_path) < threshold_time:
+                    os.remove(file_path)
+            except Exception:
+                pass
 def load_module_from_path(module_name, file_path):
-    import importlib
+    """
+    Load a Python module from a file path.
+    This function dynamically loads a Python module from a file path,
+    useful for loading configuration files or custom modules.
+    Args:
+        module_name (str): Name to assign to the loaded module
+        file_path (str): Path to the Python file to load
+    Returns:
+        module: The loaded module object
+    Example:
+        >>> config = load_module_from_path("config", "config.py")
+        >>> print(config.some_variable)
+    """
+    import importlib.util
     spec = importlib.util.spec_from_file_location(module_name, file_path)
     module = importlib.util.module_from_spec(spec)
-    try:
-        spec.loader.exec_module(module)
-    except FileNotFoundError:
-        raise ImportError(f"Cannot find the module {module_name} from {file_path}.")
+    spec.loader.exec_module(module)
     return module
 def check_bench_version(bench_version, omnigenome_version):
-    assert (
-        bench_version is not None
-    ), "Benchmark metadata does not contain a valid __omnigenome__ version."
+    """
+    Check if benchmark version is compatible with OmniGenome version.
-    if not isinstance(bench_version, (int, float, str)):
-        raise TypeError(
-            f"Invalid type for benchmark version. Expected int, float, or str but got {type(bench_version).__name__}."
-        )
+    This function compares the benchmark version with the OmniGenome version
+    to ensure compatibility and warns if there are potential issues.
-    assert (
-        omnigenome_version is not None
-    ), "AutoBench is missing a valid omnigenome version."
+    Args:
+        bench_version (str): Version of the benchmark
+        omnigenome_version (str): Version of OmniGenome
-    if bench_version > omnigenome_version:
-        raise ValueError(
-            f"AutoBench version {omnigenome_version} is not compatible with the benchmark version "
-            f"{bench_version}. Please update the benchmark or AutoBench."
+    Example:
+        >>> check_bench_version("0.2.0", "0.3.0")
+    """
+    if bench_version != omnigenome_version:
+        warnings.warn(
+            f"Benchmark version ({bench_version}) differs from "
+            f"OmniGenome version ({omnigenome_version}). "
+            f"This may cause compatibility issues."
         )
 def clean_temp_dir_pt_files():
-    tmp_dir = tempfile.gettempdir()
-    for f in os.listdir(tmp_dir):
-        if f.endswith(".pt") and f.startswith("tmp_ckpt"):
-            path = os.path.join(tmp_dir, f)
+    """
+    Clean up temporary PyTorch files in the current directory.
+    This function removes temporary PyTorch files (like .pt, .pth files)
+    that may be left over from previous runs.
+    Example:
+        >>> clean_temp_dir_pt_files()
+    """
+    import glob
+    temp_patterns = ["*.pt", "*.pth", "temp_*", "checkpoint_*"]
+    for pattern in temp_patterns:
+        for file_path in glob.glob(pattern):
             try:
-                os.remove(path)
-                print(f"Removed: {path}")
-            except Exception as e:
-                print(f"Failed to remove {path}: {e}")
+                if os.path.isfile(file_path):
+                    os.remove(file_path)
+            except Exception:
+                pass

omnigenome/src/model/augmentation/__init__.py CHANGED Viewed

@@ -9,4 +9,3 @@
 """
 This package contains modules for data augmentation.
 """

omnigenome 0.3.0a0__py3-none-any.whl → 0.3.1a0__py3-none-any.whl

omnigenome 0.3.0a0__py3-none-any.whl → 0.3.1a0__py3-none-any.whl