omnigenome 0.3.0a0__py3-none-any.whl → 0.3.1a0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (73)
  1. omnigenome/__init__.py +29 -44
  2. omnigenome/auto/auto_bench/__init__.py +0 -1
  3. omnigenome/auto/auto_bench/auto_bench.py +24 -14
  4. omnigenome/auto/auto_train/__init__.py +0 -1
  5. omnigenome/auto/auto_train/auto_train.py +11 -12
  6. omnigenome/auto/bench_hub/__init__.py +0 -1
  7. omnigenome/auto/bench_hub/bench_hub.py +1 -1
  8. omnigenome/cli/__init__.py +0 -1
  9. omnigenome/cli/commands/__init__.py +0 -1
  10. omnigenome/cli/commands/base.py +10 -10
  11. omnigenome/cli/commands/bench/__init__.py +0 -1
  12. omnigenome/cli/commands/bench/bench_cli.py +10 -10
  13. omnigenome/cli/commands/rna/__init__.py +0 -1
  14. omnigenome/cli/commands/rna/rna_design.py +10 -11
  15. omnigenome/src/__init__.py +0 -1
  16. omnigenome/src/abc/__init__.py +0 -1
  17. omnigenome/src/abc/abstract_dataset.py +38 -19
  18. omnigenome/src/abc/abstract_metric.py +7 -7
  19. omnigenome/src/abc/abstract_model.py +15 -14
  20. omnigenome/src/abc/abstract_tokenizer.py +9 -7
  21. omnigenome/src/dataset/omni_dataset.py +16 -14
  22. omnigenome/src/lora/__init__.py +0 -1
  23. omnigenome/src/lora/lora_model.py +47 -41
  24. omnigenome/src/metric/classification_metric.py +11 -11
  25. omnigenome/src/metric/metric.py +19 -19
  26. omnigenome/src/metric/ranking_metric.py +15 -15
  27. omnigenome/src/metric/regression_metric.py +18 -18
  28. omnigenome/src/misc/utils.py +214 -150
  29. omnigenome/src/model/augmentation/__init__.py +0 -1
  30. omnigenome/src/model/augmentation/model.py +17 -17
  31. omnigenome/src/model/classification/__init__.py +0 -1
  32. omnigenome/src/model/classification/model.py +28 -32
  33. omnigenome/src/model/embedding/__init__.py +0 -1
  34. omnigenome/src/model/embedding/model.py +35 -35
  35. omnigenome/src/model/mlm/__init__.py +0 -1
  36. omnigenome/src/model/mlm/model.py +13 -13
  37. omnigenome/src/model/module_utils.py +17 -17
  38. omnigenome/src/model/regression/__init__.py +0 -1
  39. omnigenome/src/model/regression/model.py +72 -77
  40. omnigenome/src/model/regression/resnet.py +32 -32
  41. omnigenome/src/model/rna_design/__init__.py +0 -1
  42. omnigenome/src/model/rna_design/model.py +168 -118
  43. omnigenome/src/model/seq2seq/__init__.py +0 -1
  44. omnigenome/src/model/seq2seq/model.py +4 -4
  45. omnigenome/src/tokenizer/bpe_tokenizer.py +27 -27
  46. omnigenome/src/tokenizer/kmers_tokenizer.py +22 -22
  47. omnigenome/src/tokenizer/single_nucleotide_tokenizer.py +11 -11
  48. omnigenome/src/trainer/accelerate_trainer.py +40 -32
  49. omnigenome/src/trainer/hf_trainer.py +8 -8
  50. omnigenome/src/trainer/trainer.py +37 -25
  51. omnigenome/utility/dataset_hub/__init__.py +0 -1
  52. omnigenome/utility/dataset_hub/dataset_hub.py +13 -13
  53. omnigenome/utility/ensemble.py +26 -26
  54. omnigenome/utility/hub_utils.py +8 -8
  55. omnigenome/utility/model_hub/__init__.py +0 -1
  56. omnigenome/utility/model_hub/model_hub.py +26 -25
  57. omnigenome/utility/pipeline_hub/__init__.py +0 -1
  58. omnigenome/utility/pipeline_hub/pipeline.py +49 -49
  59. omnigenome/utility/pipeline_hub/pipeline_hub.py +17 -17
  60. {omnigenome-0.3.0a0.dist-info → omnigenome-0.3.1a0.dist-info}/METADATA +3 -3
  61. omnigenome-0.3.1a0.dist-info/RECORD +78 -0
  62. {omnigenome-0.3.0a0.dist-info → omnigenome-0.3.1a0.dist-info}/top_level.txt +0 -1
  63. omnigenome-0.3.0a0.dist-info/RECORD +0 -85
  64. tests/__init__.py +0 -9
  65. tests/conftest.py +0 -160
  66. tests/test_dataset_patterns.py +0 -291
  67. tests/test_examples_syntax.py +0 -83
  68. tests/test_model_loading.py +0 -183
  69. tests/test_rna_functions.py +0 -255
  70. tests/test_training_patterns.py +0 -302
  71. {omnigenome-0.3.0a0.dist-info → omnigenome-0.3.1a0.dist-info}/WHEEL +0 -0
  72. {omnigenome-0.3.0a0.dist-info → omnigenome-0.3.1a0.dist-info}/entry_points.txt +0 -0
  73. {omnigenome-0.3.0a0.dist-info → omnigenome-0.3.1a0.dist-info}/licenses/LICENSE +0 -0
omnigenome/src/model/rna_design/model.py
@@ -18,9 +18,11 @@ import numpy as np
 import torch
 import autocuda
 from transformers import AutoModelForMaskedLM, AutoTokenizer
-from concurrent.futures import ProcessPoolExecutor
+from concurrent.futures import ProcessPoolExecutor, as_completed
 import ViennaRNA
 from scipy.spatial.distance import hamming
+import warnings
+import os
 
 from omnigenome.src.misc.utils import fprint
 
@@ -28,19 +30,19 @@ from omnigenome.src.misc.utils import fprint
 class OmniModelForRNADesign(torch.nn.Module):
     """
     RNA design model using masked language modeling and evolutionary algorithms.
-
+
     This model combines a pre-trained masked language model with evolutionary
     algorithms to design RNA sequences that fold into specific target structures.
     It uses a multi-objective optimization approach to balance structure similarity
     and thermodynamic stability.
-
+
     Attributes:
         device: Device to run the model on (CPU or GPU)
         parallel: Whether to use parallel processing for structure prediction
         tokenizer: Tokenizer for processing RNA sequences
         model: Pre-trained masked language model
     """
-
+
     def __init__(
         self,
         model="yangheng/OmniGenome-186M",
@@ -51,7 +53,7 @@ class OmniModelForRNADesign(torch.nn.Module):
     ):
         """
         Initialize the RNA design model.
-
+
         Args:
             model (str): Model name or path for the pre-trained MLM model
             device: Device to run the model on (default: None, auto-detect)
@@ -70,164 +72,216 @@ class OmniModelForRNADesign(torch.nn.Module):
     def _random_bp_span(bp_span=None):
         """
         Generate a random base pair span.
-
+
         Args:
-            bp_span (int, optional): Base pair span to center around (default: None)
-
+            bp_span (int, optional): Fixed base pair span. If None, generates random.
+
         Returns:
-            int: Random base pair span within ±50 of the input span
+            int: Base pair span value
         """
-        return random.choice(range(max(0, bp_span - 50), min(bp_span + 50, 400)))
+        if bp_span is None:
+            return random.randint(1, 10)
+        return bp_span
 
     @staticmethod
     def _longest_bp_span(structure):
         """
-        Compute the longest base-pair span from RNA structure.
-
+        Find the longest base pair span in the structure.
+
         Args:
             structure (str): RNA structure in dot-bracket notation
-
+
         Returns:
-            int: Length of the longest base-pair span
+            int: Length of the longest base pair span
         """
-        stack = []
         max_span = 0
-        for i, char in enumerate(structure):
+        current_span = 0
+
+        for char in structure:
             if char == "(":
-                stack.append(i)
-            elif char == ")" and stack:
-                left_index = stack.pop()
-                max_span = max(max_span, i - left_index)
+                current_span += 1
+                max_span = max(max_span, current_span)
+            elif char == ")":
+                current_span = max(0, current_span - 1)
+            else:
+                current_span = 0
+
         return max_span
 
     @staticmethod
     def _predict_structure_single(sequence, bp_span=-1):
         """
-        Predict the RNA structure and minimum free energy (MFE) for a single sequence.
-
+        Predict structure for a single sequence (worker function for multiprocessing).
+
         Args:
-            sequence (str): RNA sequence
-            bp_span (int): Maximum base pair span for folding (default: -1, no limit)
-
+            sequence (str): RNA sequence to fold
+            bp_span (int): Base pair span parameter
+
         Returns:
-            tuple: (structure, mfe) where structure is in dot-bracket notation
+            tuple: (structure, mfe) tuple
         """
-        md = ViennaRNA.md()
-        md.max_bp_span = bp_span
-        fc = ViennaRNA.fold_compound(sequence, md)
-        return fc.mfe()
+        try:
+            return ViennaRNA.fold(sequence)
+        except Exception as e:
+            warnings.warn(f"Failed to fold sequence {sequence}: {e}")
+            return ("." * len(sequence), 0.0)
 
     def _predict_structure(self, sequences, bp_span=-1):
         """
-        Predict RNA structures for multiple sequences.
-
+        Predict structures for multiple sequences.
+
         Args:
             sequences (list): List of RNA sequences
-            bp_span (int): Maximum base pair span for folding (default: -1, no limit)
-
+            bp_span (int): Base pair span parameter
+
         Returns:
             list: List of (structure, mfe) tuples
         """
-        return [self._predict_structure_single(seq, bp_span) for seq in sequences]
+        if not self.parallel or len(sequences) <= 1:
+            # Sequential processing
+            return [self._predict_structure_single(seq, bp_span) for seq in sequences]
+
+        # Parallel processing with improved error handling
+        try:
+            # Determine number of workers
+            max_workers = min(os.cpu_count(), len(sequences), 8)  # Limit to 8 workers
+
+            with ProcessPoolExecutor(max_workers=max_workers) as executor:
+                # Submit all tasks
+                future_to_seq = {
+                    executor.submit(self._predict_structure_single, seq, bp_span): seq
+                    for seq in sequences
+                }
+
+                # Collect results
+                results = []
+                for future in as_completed(future_to_seq):
+                    try:
+                        result = future.result()
+                        results.append(result)
+                    except Exception as e:
+                        seq = future_to_seq[future]
+                        warnings.warn(f"Failed to process sequence {seq}: {e}")
+                        # Fallback to dot structure
+                        results.append(("." * len(seq), 0.0))
+
+                return results
+
+        except Exception as e:
+            warnings.warn(
+                f"Parallel processing failed, falling back to sequential: {e}"
+            )
+            # Fallback to sequential processing
+            return [self._predict_structure_single(seq, bp_span) for seq in sequences]
 
     def _init_population(self, structure, num_population):
         """
-        Initialize the population with masked sequences.
-
+        Initialize the population with random sequences.
+
         Args:
-            structure (str): Target RNA structure in dot-bracket notation
-            num_population (int): Number of individuals in the population
-
+            structure (str): Target RNA structure
+            num_population (int): Population size
+
         Returns:
-            list: List of (sequence, bp_span) tuples representing the initial population
+            list: List of (sequence, bp_span) tuples
         """
         population = []
-        mlm_inputs = []
-        for _ in range(num_population):
-            masked_sequence = "".join(
-                [random.choice(["G", "C", "<mask>"]) for _ in structure]
-            )
-            mlm_inputs.append(f"{masked_sequence}<eos>{structure}")
-
-        outputs = self._mlm_predict(mlm_inputs, structure)
+        bp_span = self._longest_bp_span(structure)
 
-        for i, output in enumerate(outputs):
-            sequence = self.tokenizer.convert_ids_to_tokens(output.tolist())
-            fixed_sequence = [
-                x if x in "AGCT" else random.choice(["A", "T", "G", "C"])
-                for x in sequence
-            ]
-            bp_span = self._random_bp_span(len(structure))
-            population.append(("".join(fixed_sequence), bp_span))
+        for _ in range(num_population):
+            # Generate random sequence
+            sequence = "".join(random.choice("ACGU") for _ in range(len(structure)))
+            population.append((sequence, bp_span))
 
         return population
 
     def _mlm_mutate(self, population, structure, mutation_ratio):
         """
-        Apply mutation to the population using the masked language model (MLM).
-
+        Mutate population using masked language modeling.
+
         Args:
-            population (list): Current population of (sequence, bp_span) tuples
+            population (list): Current population
             structure (str): Target RNA structure
             mutation_ratio (float): Ratio of tokens to mutate
-
+
         Returns:
-            list: Mutated population of (sequence, bp_span) tuples
+            list: Mutated population
         """
 
         def mutate(sequence, mutation_rate):
-            sequence = np.array(list(sequence))
-            masked_indices = np.random.rand(len(sequence)) < mutation_rate
-            sequence[masked_indices] = "$"
-            return "".join(sequence).replace("$", "<mask>")
+            # Create masked sequence
+            masked_sequence = list(sequence)
+            num_mutations = int(len(sequence) * mutation_rate)
+            mutation_positions = random.sample(range(len(sequence)), num_mutations)
 
-        mlm_inputs = []
-        for sequence, bp_span in population:
-            masked_sequence = mutate(sequence, mutation_ratio)
-            mlm_inputs.append(f"{masked_sequence}<eos>{structure}")
+            for pos in mutation_positions:
+                masked_sequence[pos] = self.tokenizer.mask_token
 
-        outputs = self._mlm_predict(mlm_inputs, structure)
+            return "".join(masked_sequence)
 
-        mut_population = []
-        for i, (seq, bp_span) in enumerate(population):
-            sequence = self.tokenizer.convert_ids_to_tokens(outputs[i].tolist())
-            fixed_sequence = [
-                x if x in "AGCT" else random.choice(["A", "T", "G", "C"])
-                for x in sequence
-            ]
-            bp_span = self._random_bp_span(bp_span)
-            mut_population.append(("".join(fixed_sequence), bp_span))
+        # Prepare inputs for MLM
+        mlm_inputs = []
+        for sequence, bp_span in population:
+            masked_seq = mutate(sequence, mutation_ratio)
+            mlm_inputs.append(masked_seq)
+
+        # Get predictions from MLM
+        predicted_tokens = self._mlm_predict(mlm_inputs, structure)
+
+        # Convert predictions back to sequences
+        mutated_population = []
+        for i, (sequence, bp_span) in enumerate(population):
+            # Convert token IDs back to nucleotides
+            new_sequence = self.tokenizer.decode(
+                predicted_tokens[i], skip_special_tokens=True
+            )
+            # Ensure the sequence has the correct length
+            if len(new_sequence) != len(structure):
+                new_sequence = new_sequence[: len(structure)].ljust(len(structure), "A")
+            mutated_population.append((new_sequence, bp_span))
 
-        return mut_population
+        return mutated_population
 
     def _crossover(self, population, num_points=3):
         """
-        Perform crossover operation to create offspring.
-
+        Perform crossover operation on the population.
+
         Args:
-            population (list): Current population of (sequence, bp_span) tuples
-            num_points (int): Number of crossover points (default: 3)
-
+            population (list): Current population
+            num_points (int): Number of crossover points
+
         Returns:
-            list: Offspring population after crossover
+            list: Population after crossover
         """
-        population_size = len(population)
-        sequence_length = len(population[0][0])
+        if len(population) < 2:
+            return population
+
+        # Create crossover masks
+        num_sequences = len(population)
+        masks = np.zeros((num_sequences, len(population[0][0])), dtype=bool)
 
-        parent_indices = np.random.choice(population_size // 10, (population_size, 2))
-        crossover_points = np.sort(
-            np.random.randint(1, sequence_length, size=(population_size, num_points)),
-            axis=1,
+        # Generate random crossover points
+        crossover_points = np.random.randint(
+            0, len(population[0][0]), (num_sequences, num_points)
         )
 
-        masks = np.zeros((population_size, sequence_length), dtype=bool)
-        for i in range(population_size):
-            last_point = 0
+        # Create parent indices
+        parent_indices = np.random.randint(0, num_sequences, (num_sequences, 2))
+
+        # Generate crossover masks
+        for i in range(num_sequences):
             for j in range(num_points):
-                masks[i, last_point : crossover_points[i, j]] = j % 2 == 0
-                last_point = crossover_points[i, j]
+                if j == 0:
+                    masks[i, : crossover_points[i, j]] = True
+                else:
+                    last_point = crossover_points[i, j - 1]
+                    masks[i, last_point : crossover_points[i, j]] = j % 2 == 0
+
+            # Handle the last segment
+            last_point = crossover_points[i, -1]
             masks[i, last_point:] = num_points % 2 == 0
 
+        # Perform crossover
         population_array = np.array([list(seq[0]) for seq in population])
        child1_array = np.where(
            masks,
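The core functional change in this hunk is `_predict_structure`, which swaps a plain list comprehension for a bounded process pool. A minimal self-contained sketch of the same submit-and-collect pattern, with a toy `fold` standing in for `ViennaRNA.fold` so it runs without ViennaRNA installed:

```python
import os
import warnings
from concurrent.futures import ProcessPoolExecutor, as_completed

def fold(seq):
    # Toy stand-in for ViennaRNA.fold: returns (dot-bracket structure, MFE).
    return ("." * len(seq), 0.0)

def predict_structures(sequences, hard_cap=8):
    # Worker count capped by CPUs, task count, and a hard limit, as in the diff.
    max_workers = min(os.cpu_count(), len(sequences), hard_cap)
    with ProcessPoolExecutor(max_workers=max_workers) as executor:
        future_to_seq = {executor.submit(fold, s): s for s in sequences}
        results = []
        for future in as_completed(future_to_seq):  # completion order, not input order
            try:
                results.append(future.result())
            except Exception as e:
                seq = future_to_seq[future]
                warnings.warn(f"Failed to fold {seq}: {e}")
                results.append(("." * len(seq), 0.0))  # neutral fallback
    return results

if __name__ == "__main__":  # required for process pools on spawn platforms
    print(predict_structures(["ACGUACGU", "GGGCAAACGCCC"]))
```

One caveat worth noting: `as_completed` yields futures in completion order, not submission order, so downstream code that zips the results against the input list (as `_evaluate_structure_fitness` does in the next hunk) depends on the caller realigning them.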
@@ -251,23 +305,19 @@ class OmniModelForRNADesign(torch.nn.Module):
     def _evaluate_structure_fitness(self, sequences, structure):
         """
         Evaluate the fitness of the RNA structure by comparing with the target structure.
-
+
         Args:
             sequences (list): List of (sequence, bp_span) tuples to evaluate
             structure (str): Target RNA structure
-
+
         Returns:
             list: Sorted population with fitness scores and MFE values
         """
-        if self.parallel:
-            with ProcessPoolExecutor() as executor:
-                structures_mfe = list(
-                    executor.map(
-                        self._predict_structure_single, [seq for seq, _ in sequences]
-                    )
-                )
-        else:
-            structures_mfe = self._predict_structure([seq for seq, _ in sequences])
+        # Get sequences for structure prediction
+        seq_list = [seq for seq, _ in sequences]
+
+        # Predict structures (with improved multiprocessing)
+        structures_mfe = self._predict_structure(seq_list)
 
         sorted_population = []
         for (seq, bp_span), (ss, mfe) in zip(sequences, structures_mfe):
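The loop closing this hunk pairs each candidate `(seq, bp_span)` with its predicted `(ss, mfe)`; the scoring line itself falls outside the hunk. A sketch of how a structure-similarity score can be derived from the `scipy.spatial.distance.hamming` import at the top of the file — the exact formula used by the package is an assumption here:

```python
from scipy.spatial.distance import hamming

def structure_score(predicted, target):
    # hamming() returns the fraction of mismatched positions, so
    # 1 - hamming is the fraction of positions matching the target.
    return 1 - hamming(list(predicted), list(target))

# One mismatch out of nine positions -> 0.888...
print(structure_score("(((....))", "(((...)))"))
```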
@@ -283,11 +333,11 @@ class OmniModelForRNADesign(torch.nn.Module):
     def _non_dominated_sorting(scores, mfe_values):
         """
         Perform non-dominated sorting for multi-objective optimization.
-
+
         Args:
             scores (list): Structure similarity scores
             mfe_values (list): Minimum free energy values
-
+
         Returns:
             list: List of fronts (Pareto fronts)
         """
@@ -326,11 +376,11 @@ class OmniModelForRNADesign(torch.nn.Module):
     def _select_next_generation(next_generation, fronts):
         """
         Select the next generation based on Pareto fronts.
-
+
         Args:
             next_generation (list): Current population with fitness scores
             fronts (list): Pareto fronts
-
+
         Returns:
             list: Selected population for the next generation
         """
@@ -346,11 +396,11 @@ class OmniModelForRNADesign(torch.nn.Module):
     def _mlm_predict(self, mlm_inputs, structure):
         """
         Perform masked language model prediction.
-
+
         Args:
             mlm_inputs (list): List of masked input sequences
             structure (str): Target RNA structure
-
+
         Returns:
             list: Predicted token IDs for each input
         """
@@ -360,7 +410,7 @@ class OmniModelForRNADesign(torch.nn.Module):
         with torch.no_grad():
             for i in range(0, len(mlm_inputs), batch_size):
                 inputs = self.tokenizer(
-                    mlm_inputs[i: i + batch_size],
+                    mlm_inputs[i : i + batch_size],
                     padding=False,
                     max_length=1024,
                     truncation=True,
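Apart from the slice reformatting, this is the batched inference loop that backs `_mlm_mutate`. A generic sketch of the same pattern with the transformers API; the checkpoint is the constructor default seen earlier, and loading it may need extra kwargs (e.g. `trust_remote_code`) that this sketch omits:

```python
import torch
from transformers import AutoModelForMaskedLM, AutoTokenizer

NAME = "yangheng/OmniGenome-186M"
tokenizer = AutoTokenizer.from_pretrained(NAME)
model = AutoModelForMaskedLM.from_pretrained(NAME)

def mlm_predict(mlm_inputs, batch_size=8, max_length=1024):
    predictions = []
    with torch.no_grad():
        for i in range(0, len(mlm_inputs), batch_size):
            # padding=True for generality; the diff can use padding=False
            # because every masked input shares the target structure's length.
            inputs = tokenizer(
                mlm_inputs[i : i + batch_size],
                padding=True,
                max_length=max_length,
                truncation=True,
                return_tensors="pt",
            )
            logits = model(**inputs).logits
            # Greedy decoding: most likely token at each position.
            predictions.extend(logits.argmax(dim=-1))
    return predictions
```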
@@ -379,13 +429,13 @@ class OmniModelForRNADesign(torch.nn.Module):
     ):
         """
         Design RNA sequences for a target structure using evolutionary algorithms.
-
+
         Args:
             structure (str): Target RNA structure in dot-bracket notation
             mutation_ratio (float): Ratio of tokens to mutate (default: 0.5)
             num_population (int): Population size (default: 100)
             num_generation (int): Number of generations (default: 100)
-
+
         Returns:
             list: List of designed RNA sequences with their fitness scores
         """
omnigenome/src/model/seq2seq/__init__.py
@@ -9,4 +9,3 @@
 """
 This package contains modules for sequence-to-sequence models.
 """
-
omnigenome/src/model/seq2seq/model.py
@@ -21,20 +21,20 @@ from ...abc.abstract_model import OmniModel
 class OmniModelForSeq2Seq(OmniModel):
     """
     Sequence-to-sequence model for genomic sequences.
-
+
     This model implements a sequence-to-sequence architecture for genomic
     sequences, where the input is one sequence and the output is another
     sequence. It's useful for tasks like sequence translation, structure
     prediction, or sequence transformation.
-
+
     The model can be extended to implement specific seq2seq tasks by
     overriding the forward, predict, and inference methods.
     """
-
+
     def __init__(self, config_or_model, tokenizer, *args, **kwargs):
         """
         Initialize the sequence-to-sequence model.
-
+
         Args:
             config_or_model: Model configuration or pre-trained model
             tokenizer: Tokenizer for processing input sequences
@@ -17,17 +17,17 @@ warnings.filterwarnings("once")
17
17
  def is_bpe_tokenization(tokens, threshold=0.1):
18
18
  """
19
19
  Check if the tokenization is BPE-based by analyzing token characteristics.
20
-
20
+
21
21
  This function examines the tokens to determine if they follow BPE tokenization
22
22
  patterns by analyzing token length distributions and special token patterns.
23
-
23
+
24
24
  Args:
25
25
  tokens (list): List of tokens to analyze
26
26
  threshold (float, optional): Threshold for determining BPE tokenization. Defaults to 0.1
27
-
27
+
28
28
  Returns:
29
29
  bool: True if tokens appear to be BPE-based, False otherwise
30
-
30
+
31
31
  Example:
32
32
  >>> tokens = ["▁hello", "▁world", "▁how", "▁are", "▁you"]
33
33
  >>> is_bpe = is_bpe_tokenization(tokens)
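The function body is outside this hunk, so the following is a purely hypothetical illustration of the heuristic the docstring describes (token length distributions plus special-token markers such as the `▁` prefix in the example):

```python
def looks_like_bpe(tokens, threshold=0.1):
    # Hypothetical sketch: count tokens with BPE/SentencePiece traits,
    # i.e. a "▁" word-boundary marker or multi-character subwords.
    if not tokens:
        return False
    bpe_like = sum(1 for t in tokens if t.startswith("▁") or len(t) > 1)
    return bpe_like / len(tokens) >= threshold

print(looks_like_bpe(["▁hello", "▁world", "▁how", "▁are", "▁you"]))  # True
```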
@@ -52,15 +52,15 @@ def is_bpe_tokenization(tokens, threshold=0.1):
 class OmniBPETokenizer(OmniTokenizer):
     """
     A Byte Pair Encoding (BPE) tokenizer for genomic sequences.
-
+
     This tokenizer uses BPE tokenization for genomic sequences and provides
     validation to ensure the base tokenizer is BPE-based. It supports sequence
     preprocessing and handles various input formats.
-
+
     Attributes:
         base_tokenizer: The underlying BPE tokenizer
         metadata: Dictionary containing tokenizer metadata
-
+
     Example:
         >>> from omnigenome.src.tokenizer import OmniBPETokenizer
         >>> from transformers import AutoTokenizer
@@ -75,7 +75,7 @@ class OmniBPETokenizer(OmniTokenizer):
     def __init__(self, base_tokenizer=None, **kwargs):
         """
         Initialize the OmniBPETokenizer.
-
+
         Args:
             base_tokenizer: The base BPE tokenizer
             **kwargs: Additional keyword arguments passed to parent class
@@ -86,21 +86,21 @@ class OmniBPETokenizer(OmniTokenizer):
     def __call__(self, sequence, **kwargs):
         """
         Tokenize a sequence using BPE tokenization.
-
+
         This method processes the input sequence using BPE tokenization,
         handles sequence preprocessing (U/T conversion, whitespace addition),
         and validates that the tokenization is BPE-based.
-
+
         Args:
             sequence (str): Input sequence to tokenize
             **kwargs: Additional keyword arguments including max_length
-
+
         Returns:
             dict: Dictionary containing tokenized inputs with keys 'input_ids' and 'attention_mask'
-
+
         Raises:
             ValueError: If the tokenizer is not BPE-based
-
+
         Example:
             >>> sequence = "ACGUAGGUAUCGUAGA"
             >>> tokenized = tokenizer(sequence)
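The preprocessing steps named in the docstring (U/T conversion, whitespace addition) are implemented outside this hunk; a hypothetical sketch of what they amount to, with the conversion direction (U to T) being an assumption:

```python
def preprocess(sequence):
    # Hypothetical sketch: map U -> T and space-separate residues.
    sequence = sequence.replace("U", "T")
    return " ".join(sequence)

print(preprocess("ACGUAGGUAUCGUAGA"))  # "A C G T A G G T A T C G T A G A"
```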
@@ -136,14 +136,14 @@ class OmniBPETokenizer(OmniTokenizer):
     def from_pretrained(model_name_or_path, **kwargs):
         """
         Create a BPE tokenizer from a pre-trained model.
-
+
         Args:
             model_name_or_path (str): Name or path of the pre-trained model
             **kwargs: Additional keyword arguments
-
+
         Returns:
             OmniBPETokenizer: Initialized BPE tokenizer
-
+
         Example:
             >>> tokenizer = OmniBPETokenizer.from_pretrained("facebook/esm2_t12_35M_UR50D")
             >>> print(type(tokenizer))
@@ -159,14 +159,14 @@ class OmniBPETokenizer(OmniTokenizer):
     def tokenize(self, sequence, **kwargs):
         """
         Tokenize a sequence using the base BPE tokenizer.
-
+
         Args:
             sequence (str): Input sequence to tokenize
             **kwargs: Additional keyword arguments
-
+
         Returns:
             list: List of tokens
-
+
         Example:
             >>> sequence = "ACGUAGGUAUCGUAGA"
             >>> tokens = tokenizer.tokenize(sequence)
@@ -178,17 +178,17 @@ class OmniBPETokenizer(OmniTokenizer):
     def encode(self, sequence, **kwargs):
         """
         Encode a sequence using the base BPE tokenizer.
-
+
         Args:
             sequence (str): Input sequence to encode
             **kwargs: Additional keyword arguments
-
+
         Returns:
             list: List of token IDs
-
+
         Raises:
             AssertionError: If the base tokenizer is not BPE-based
-
+
         Example:
             >>> sequence = "ACGUAGGUAUCGUAGA"
             >>> token_ids = tokenizer.encode(sequence)
@@ -203,17 +203,17 @@ class OmniBPETokenizer(OmniTokenizer):
     def decode(self, sequence, **kwargs):
         """
         Decode a sequence using the base BPE tokenizer.
-
+
         Args:
             sequence: Input sequence to decode (can be token IDs or tokens)
             **kwargs: Additional keyword arguments
-
+
         Returns:
             str: Decoded sequence
-
+
         Raises:
             AssertionError: If the base tokenizer is not BPE-based
-
+
         Example:
             >>> token_ids = [1, 2, 3, 4, 5]
             >>> sequence = tokenizer.decode(token_ids)
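The tokenize/encode/decode trio documented above composes into the usual round trip. A usage sketch assembled from the docstring examples in this file (both the import path and the ESM-2 checkpoint appear in them):

```python
from omnigenome.src.tokenizer import OmniBPETokenizer

tokenizer = OmniBPETokenizer.from_pretrained("facebook/esm2_t12_35M_UR50D")

sequence = "ACGUAGGUAUCGUAGA"
tokens = tokenizer.tokenize(sequence)   # list of BPE tokens
token_ids = tokenizer.encode(sequence)  # list of token IDs
decoded = tokenizer.decode(token_ids)   # back to a string

print(tokens)
print(token_ids)
print(decoded)
```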