valuesets 0.3.1__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of valuesets might be problematic. Click here for more details.
- valuesets/__init__.py +7 -0
- valuesets/_version.py +8 -0
- valuesets/datamodel/valuesets.py +13796 -0
- valuesets/datamodel/valuesets_dataclass.py +24503 -0
- valuesets/datamodel/valuesets_pydantic.py +13796 -0
- valuesets/enums/__init__.py +590 -0
- valuesets/enums/academic/__init__.py +1 -0
- valuesets/enums/academic/research.py +559 -0
- valuesets/enums/analytical_chemistry/__init__.py +1 -0
- valuesets/enums/analytical_chemistry/mass_spectrometry.py +198 -0
- valuesets/enums/bio/__init__.py +1 -0
- valuesets/enums/bio/biological_colors.py +238 -0
- valuesets/enums/bio/cell_cycle.py +180 -0
- valuesets/enums/bio/currency_chemicals.py +52 -0
- valuesets/enums/bio/developmental_stages.py +103 -0
- valuesets/enums/bio/genome_features.py +182 -0
- valuesets/enums/bio/genomics.py +91 -0
- valuesets/enums/bio/go_aspect.py +32 -0
- valuesets/enums/bio/go_causality.py +58 -0
- valuesets/enums/bio/go_evidence.py +129 -0
- valuesets/enums/bio/human_developmental_stages.py +62 -0
- valuesets/enums/bio/insdc_geographic_locations.py +591 -0
- valuesets/enums/bio/insdc_missing_values.py +49 -0
- valuesets/enums/bio/lipid_categories.py +67 -0
- valuesets/enums/bio/mouse_developmental_stages.py +62 -0
- valuesets/enums/bio/plant_biology.py +86 -0
- valuesets/enums/bio/plant_developmental_stages.py +54 -0
- valuesets/enums/bio/plant_sex.py +81 -0
- valuesets/enums/bio/protein_evidence.py +61 -0
- valuesets/enums/bio/proteomics_standards.py +123 -0
- valuesets/enums/bio/psi_mi.py +306 -0
- valuesets/enums/bio/relationship_to_oxygen.py +37 -0
- valuesets/enums/bio/sequence_alphabets.py +449 -0
- valuesets/enums/bio/sequence_chemistry.py +357 -0
- valuesets/enums/bio/sequencing_platforms.py +302 -0
- valuesets/enums/bio/structural_biology.py +320 -0
- valuesets/enums/bio/taxonomy.py +238 -0
- valuesets/enums/bio/trophic_levels.py +85 -0
- valuesets/enums/bio/uniprot_species.py +344 -0
- valuesets/enums/bio/viral_genome_types.py +47 -0
- valuesets/enums/bioprocessing/__init__.py +1 -0
- valuesets/enums/bioprocessing/scale_up.py +249 -0
- valuesets/enums/business/__init__.py +1 -0
- valuesets/enums/business/human_resources.py +275 -0
- valuesets/enums/business/industry_classifications.py +181 -0
- valuesets/enums/business/management_operations.py +228 -0
- valuesets/enums/business/organizational_structures.py +236 -0
- valuesets/enums/business/quality_management.py +181 -0
- valuesets/enums/business/supply_chain.py +232 -0
- valuesets/enums/chemistry/__init__.py +1 -0
- valuesets/enums/chemistry/chemical_entities.py +315 -0
- valuesets/enums/chemistry/reaction_directionality.py +65 -0
- valuesets/enums/chemistry/reactions.py +256 -0
- valuesets/enums/clinical/__init__.py +1 -0
- valuesets/enums/clinical/nih_demographics.py +177 -0
- valuesets/enums/clinical/phenopackets.py +254 -0
- valuesets/enums/common_value_sets.py +8791 -0
- valuesets/enums/computing/__init__.py +1 -0
- valuesets/enums/computing/file_formats.py +294 -0
- valuesets/enums/computing/maturity_levels.py +196 -0
- valuesets/enums/computing/mime_types.py +227 -0
- valuesets/enums/confidence_levels.py +168 -0
- valuesets/enums/contributor.py +30 -0
- valuesets/enums/core.py +42 -0
- valuesets/enums/data/__init__.py +1 -0
- valuesets/enums/data/data_absent_reason.py +53 -0
- valuesets/enums/data_science/__init__.py +1 -0
- valuesets/enums/data_science/binary_classification.py +87 -0
- valuesets/enums/data_science/emotion_classification.py +66 -0
- valuesets/enums/data_science/priority_severity.py +73 -0
- valuesets/enums/data_science/quality_control.py +46 -0
- valuesets/enums/data_science/sentiment_analysis.py +50 -0
- valuesets/enums/data_science/text_classification.py +97 -0
- valuesets/enums/demographics.py +206 -0
- valuesets/enums/ecological_interactions.py +151 -0
- valuesets/enums/energy/__init__.py +1 -0
- valuesets/enums/energy/energy.py +343 -0
- valuesets/enums/energy/fossil_fuels.py +29 -0
- valuesets/enums/energy/nuclear/__init__.py +1 -0
- valuesets/enums/energy/nuclear/nuclear_facilities.py +195 -0
- valuesets/enums/energy/nuclear/nuclear_fuel_cycle.py +96 -0
- valuesets/enums/energy/nuclear/nuclear_fuels.py +175 -0
- valuesets/enums/energy/nuclear/nuclear_operations.py +191 -0
- valuesets/enums/energy/nuclear/nuclear_regulatory.py +188 -0
- valuesets/enums/energy/nuclear/nuclear_safety.py +164 -0
- valuesets/enums/energy/nuclear/nuclear_waste.py +158 -0
- valuesets/enums/energy/nuclear/reactor_types.py +163 -0
- valuesets/enums/environmental_health/__init__.py +1 -0
- valuesets/enums/environmental_health/exposures.py +265 -0
- valuesets/enums/geography/__init__.py +1 -0
- valuesets/enums/geography/geographic_codes.py +741 -0
- valuesets/enums/health/__init__.py +12 -0
- valuesets/enums/health/vaccination.py +98 -0
- valuesets/enums/health.py +36 -0
- valuesets/enums/health_base.py +36 -0
- valuesets/enums/healthcare.py +45 -0
- valuesets/enums/industry/__init__.py +1 -0
- valuesets/enums/industry/extractive_industry.py +94 -0
- valuesets/enums/industry/mining.py +388 -0
- valuesets/enums/industry/safety_colors.py +201 -0
- valuesets/enums/investigation.py +27 -0
- valuesets/enums/materials_science/__init__.py +1 -0
- valuesets/enums/materials_science/characterization_methods.py +112 -0
- valuesets/enums/materials_science/crystal_structures.py +76 -0
- valuesets/enums/materials_science/material_properties.py +119 -0
- valuesets/enums/materials_science/material_types.py +104 -0
- valuesets/enums/materials_science/pigments_dyes.py +198 -0
- valuesets/enums/materials_science/synthesis_methods.py +109 -0
- valuesets/enums/medical/__init__.py +1 -0
- valuesets/enums/medical/clinical.py +277 -0
- valuesets/enums/medical/neuroimaging.py +119 -0
- valuesets/enums/mining_processing.py +302 -0
- valuesets/enums/physics/__init__.py +1 -0
- valuesets/enums/physics/states_of_matter.py +46 -0
- valuesets/enums/social/__init__.py +1 -0
- valuesets/enums/social/person_status.py +29 -0
- valuesets/enums/spatial/__init__.py +1 -0
- valuesets/enums/spatial/spatial_qualifiers.py +246 -0
- valuesets/enums/statistics/__init__.py +5 -0
- valuesets/enums/statistics/prediction_outcomes.py +31 -0
- valuesets/enums/statistics.py +31 -0
- valuesets/enums/time/__init__.py +1 -0
- valuesets/enums/time/temporal.py +254 -0
- valuesets/enums/units/__init__.py +1 -0
- valuesets/enums/units/measurements.py +310 -0
- valuesets/enums/visual/__init__.py +1 -0
- valuesets/enums/visual/colors.py +376 -0
- valuesets/generators/__init__.py +19 -0
- valuesets/generators/auto_slot_injector.py +280 -0
- valuesets/generators/enhanced_pydantic_generator.py +100 -0
- valuesets/generators/enum_slot_generator.py +201 -0
- valuesets/generators/modular_rich_generator.py +353 -0
- valuesets/generators/prefix_standardizer.py +198 -0
- valuesets/generators/rich_enum.py +127 -0
- valuesets/generators/rich_pydantic_generator.py +310 -0
- valuesets/generators/smart_slot_syncer.py +428 -0
- valuesets/generators/sssom_generator.py +394 -0
- valuesets/merged/merged_hierarchy.yaml +21649 -0
- valuesets/schema/README.md +3 -0
- valuesets/schema/academic/research.yaml +911 -0
- valuesets/schema/analytical_chemistry/mass_spectrometry.yaml +206 -0
- valuesets/schema/bio/bio_entities.yaml +364 -0
- valuesets/schema/bio/biological_colors.yaml +434 -0
- valuesets/schema/bio/cell_cycle.yaml +309 -0
- valuesets/schema/bio/currency_chemicals.yaml +70 -0
- valuesets/schema/bio/developmental_stages.yaml +226 -0
- valuesets/schema/bio/genome_features.yaml +342 -0
- valuesets/schema/bio/genomics.yaml +101 -0
- valuesets/schema/bio/go_aspect.yaml +39 -0
- valuesets/schema/bio/go_causality.yaml +119 -0
- valuesets/schema/bio/go_evidence.yaml +215 -0
- valuesets/schema/bio/insdc_geographic_locations.yaml +911 -0
- valuesets/schema/bio/insdc_missing_values.yaml +85 -0
- valuesets/schema/bio/lipid_categories.yaml +72 -0
- valuesets/schema/bio/plant_biology.yaml +125 -0
- valuesets/schema/bio/plant_developmental_stages.yaml +77 -0
- valuesets/schema/bio/plant_sex.yaml +108 -0
- valuesets/schema/bio/protein_evidence.yaml +63 -0
- valuesets/schema/bio/proteomics_standards.yaml +116 -0
- valuesets/schema/bio/psi_mi.yaml +400 -0
- valuesets/schema/bio/relationship_to_oxygen.yaml +46 -0
- valuesets/schema/bio/sequence_alphabets.yaml +1168 -0
- valuesets/schema/bio/sequence_chemistry.yaml +477 -0
- valuesets/schema/bio/sequencing_platforms.yaml +515 -0
- valuesets/schema/bio/structural_biology.yaml +428 -0
- valuesets/schema/bio/taxonomy.yaml +453 -0
- valuesets/schema/bio/trophic_levels.yaml +118 -0
- valuesets/schema/bio/uniprot_species.yaml +1209 -0
- valuesets/schema/bio/viral_genome_types.yaml +99 -0
- valuesets/schema/bioprocessing/scale_up.yaml +458 -0
- valuesets/schema/business/human_resources.yaml +752 -0
- valuesets/schema/business/industry_classifications.yaml +448 -0
- valuesets/schema/business/management_operations.yaml +602 -0
- valuesets/schema/business/organizational_structures.yaml +645 -0
- valuesets/schema/business/quality_management.yaml +502 -0
- valuesets/schema/business/supply_chain.yaml +688 -0
- valuesets/schema/chemistry/chemical_entities.yaml +639 -0
- valuesets/schema/chemistry/reaction_directionality.yaml +60 -0
- valuesets/schema/chemistry/reactions.yaml +442 -0
- valuesets/schema/clinical/nih_demographics.yaml +285 -0
- valuesets/schema/clinical/phenopackets.yaml +429 -0
- valuesets/schema/computing/file_formats.yaml +631 -0
- valuesets/schema/computing/maturity_levels.yaml +229 -0
- valuesets/schema/computing/mime_types.yaml +266 -0
- valuesets/schema/confidence_levels.yaml +206 -0
- valuesets/schema/contributor.yaml +30 -0
- valuesets/schema/core.yaml +55 -0
- valuesets/schema/data/data_absent_reason.yaml +82 -0
- valuesets/schema/data_science/binary_classification.yaml +125 -0
- valuesets/schema/data_science/emotion_classification.yaml +109 -0
- valuesets/schema/data_science/priority_severity.yaml +122 -0
- valuesets/schema/data_science/quality_control.yaml +68 -0
- valuesets/schema/data_science/sentiment_analysis.yaml +81 -0
- valuesets/schema/data_science/text_classification.yaml +135 -0
- valuesets/schema/demographics.yaml +238 -0
- valuesets/schema/ecological_interactions.yaml +298 -0
- valuesets/schema/energy/energy.yaml +595 -0
- valuesets/schema/energy/fossil_fuels.yaml +28 -0
- valuesets/schema/energy/nuclear/nuclear_facilities.yaml +463 -0
- valuesets/schema/energy/nuclear/nuclear_fuel_cycle.yaml +82 -0
- valuesets/schema/energy/nuclear/nuclear_fuels.yaml +421 -0
- valuesets/schema/energy/nuclear/nuclear_operations.yaml +480 -0
- valuesets/schema/energy/nuclear/nuclear_regulatory.yaml +200 -0
- valuesets/schema/energy/nuclear/nuclear_safety.yaml +352 -0
- valuesets/schema/energy/nuclear/nuclear_waste.yaml +332 -0
- valuesets/schema/energy/nuclear/reactor_types.yaml +394 -0
- valuesets/schema/environmental_health/exposures.yaml +355 -0
- valuesets/schema/generated_slots.yaml +1828 -0
- valuesets/schema/geography/geographic_codes.yaml +1018 -0
- valuesets/schema/health/vaccination.yaml +102 -0
- valuesets/schema/health.yaml +38 -0
- valuesets/schema/healthcare.yaml +53 -0
- valuesets/schema/industry/extractive_industry.yaml +89 -0
- valuesets/schema/industry/mining.yaml +888 -0
- valuesets/schema/industry/safety_colors.yaml +375 -0
- valuesets/schema/investigation.yaml +64 -0
- valuesets/schema/materials_science/characterization_methods.yaml +193 -0
- valuesets/schema/materials_science/crystal_structures.yaml +138 -0
- valuesets/schema/materials_science/material_properties.yaml +135 -0
- valuesets/schema/materials_science/material_types.yaml +151 -0
- valuesets/schema/materials_science/pigments_dyes.yaml +465 -0
- valuesets/schema/materials_science/synthesis_methods.yaml +186 -0
- valuesets/schema/medical/clinical.yaml +610 -0
- valuesets/schema/medical/neuroimaging.yaml +325 -0
- valuesets/schema/mining_processing.yaml +295 -0
- valuesets/schema/physics/states_of_matter.yaml +46 -0
- valuesets/schema/slot_mixins.yaml +143 -0
- valuesets/schema/social/person_status.yaml +28 -0
- valuesets/schema/spatial/spatial_qualifiers.yaml +466 -0
- valuesets/schema/statistics/prediction_outcomes.yaml +26 -0
- valuesets/schema/statistics.yaml +34 -0
- valuesets/schema/time/temporal.yaml +435 -0
- valuesets/schema/types.yaml +15 -0
- valuesets/schema/units/measurements.yaml +675 -0
- valuesets/schema/valuesets.yaml +100 -0
- valuesets/schema/visual/colors.yaml +778 -0
- valuesets/utils/__init__.py +6 -0
- valuesets/utils/comparison.py +102 -0
- valuesets/utils/expand_dynamic_enums.py +414 -0
- valuesets/utils/mapping_utils.py +236 -0
- valuesets/validators/__init__.py +11 -0
- valuesets/validators/enum_evaluator.py +669 -0
- valuesets/validators/oak_config.yaml +70 -0
- valuesets/validators/validate_with_ols.py +241 -0
- valuesets-0.3.1.dist-info/METADATA +395 -0
- valuesets-0.3.1.dist-info/RECORD +248 -0
- valuesets-0.3.1.dist-info/WHEEL +4 -0
- valuesets-0.3.1.dist-info/licenses/LICENSE +201 -0
|
@@ -0,0 +1,52 @@
|
|
|
1
|
+
"""
|
|
2
|
+
Currency Chemicals Value Sets
|
|
3
|
+
|
|
4
|
+
Value sets for metabolic currency molecules and cofactors used in energy transfer and redox reactions
|
|
5
|
+
|
|
6
|
+
Generated from: bio/currency_chemicals.yaml
|
|
7
|
+
"""
|
|
8
|
+
|
|
9
|
+
from __future__ import annotations
|
|
10
|
+
|
|
11
|
+
from typing import Dict, Any, Optional
|
|
12
|
+
from valuesets.generators.rich_enum import RichEnum
|
|
13
|
+
|
|
14
|
+
class CurrencyChemical(RichEnum):
|
|
15
|
+
"""
|
|
16
|
+
Common metabolic currency molecules and cofactors that serve as energy carriers, electron donors/acceptors, and group transfer agents in cellular metabolism.
|
|
17
|
+
"""
|
|
18
|
+
# Enum members
|
|
19
|
+
ATP = "ATP"
|
|
20
|
+
ADP = "ADP"
|
|
21
|
+
AMP = "AMP"
|
|
22
|
+
GTP = "GTP"
|
|
23
|
+
GDP = "GDP"
|
|
24
|
+
NAD_PLUS = "NAD_PLUS"
|
|
25
|
+
NADH = "NADH"
|
|
26
|
+
NADP_PLUS = "NADP_PLUS"
|
|
27
|
+
NADPH = "NADPH"
|
|
28
|
+
FAD = "FAD"
|
|
29
|
+
FADH2 = "FADH2"
|
|
30
|
+
COA = "COA"
|
|
31
|
+
ACETYL_COA = "ACETYL_COA"
|
|
32
|
+
|
|
33
|
+
# Set metadata after class creation
|
|
34
|
+
CurrencyChemical._metadata = {
|
|
35
|
+
"ATP": {'description': 'Adenosine triphosphate - primary energy currency molecule in cells', 'meaning': 'CHEBI:15422'},
|
|
36
|
+
"ADP": {'description': 'Adenosine diphosphate - product of ATP hydrolysis, energy acceptor', 'meaning': 'CHEBI:16761'},
|
|
37
|
+
"AMP": {'description': 'Adenosine monophosphate - nucleotide, product of ADP hydrolysis', 'meaning': 'CHEBI:16027', 'aliases': ["adenosine 5'-monophosphate"]},
|
|
38
|
+
"GTP": {'description': 'Guanosine triphosphate - energy molecule, protein synthesis and signaling', 'meaning': 'CHEBI:15996'},
|
|
39
|
+
"GDP": {'description': 'Guanosine diphosphate - product of GTP hydrolysis', 'meaning': 'CHEBI:17552'},
|
|
40
|
+
"NAD_PLUS": {'description': 'Nicotinamide adenine dinucleotide (oxidized) - electron acceptor in catabolism', 'meaning': 'CHEBI:15846'},
|
|
41
|
+
"NADH": {'description': 'Nicotinamide adenine dinucleotide (reduced) - electron donor, reducing agent', 'meaning': 'CHEBI:16908'},
|
|
42
|
+
"NADP_PLUS": {'description': 'Nicotinamide adenine dinucleotide phosphate (oxidized) - electron acceptor', 'meaning': 'CHEBI:18009'},
|
|
43
|
+
"NADPH": {'description': 'Nicotinamide adenine dinucleotide phosphate (reduced) - anabolic reducing agent', 'meaning': 'CHEBI:16474'},
|
|
44
|
+
"FAD": {'description': 'Flavin adenine dinucleotide (oxidized) - electron acceptor in oxidation reactions', 'meaning': 'CHEBI:16238'},
|
|
45
|
+
"FADH2": {'description': 'Flavin adenine dinucleotide (reduced) - electron donor in electron transport chain', 'meaning': 'CHEBI:17877'},
|
|
46
|
+
"COA": {'description': 'Coenzyme A - acyl group carrier in fatty acid metabolism', 'meaning': 'CHEBI:15346', 'aliases': ['coenzyme A']},
|
|
47
|
+
"ACETYL_COA": {'description': 'Acetyl coenzyme A - central metabolic intermediate, links glycolysis to citric acid cycle', 'meaning': 'CHEBI:15351'},
|
|
48
|
+
}
|
|
49
|
+
|
|
50
|
+
__all__ = [
|
|
51
|
+
"CurrencyChemical",
|
|
52
|
+
]
|
|
@@ -0,0 +1,103 @@
|
|
|
1
|
+
"""
|
|
2
|
+
Developmental Stages Value Sets
|
|
3
|
+
|
|
4
|
+
Ontology-mapped developmental stages for human and mouse organisms. Human stages use HsapDv (Human Developmental Stages) ontology. Mouse stages use MmusDv (Mouse Developmental Stages) ontology.
|
|
5
|
+
|
|
6
|
+
Generated from: bio/developmental_stages.yaml
|
|
7
|
+
"""
|
|
8
|
+
|
|
9
|
+
from __future__ import annotations
|
|
10
|
+
|
|
11
|
+
from typing import Dict, Any, Optional
|
|
12
|
+
from valuesets.generators.rich_enum import RichEnum
|
|
13
|
+
|
|
14
|
+
class HumanDevelopmentalStage(RichEnum):
|
|
15
|
+
# Enum members
|
|
16
|
+
ZYGOTE_STAGE = "ZYGOTE_STAGE"
|
|
17
|
+
CLEAVAGE_STAGE = "CLEAVAGE_STAGE"
|
|
18
|
+
MORULA_STAGE = "MORULA_STAGE"
|
|
19
|
+
BLASTOCYST_STAGE = "BLASTOCYST_STAGE"
|
|
20
|
+
GASTRULA_STAGE = "GASTRULA_STAGE"
|
|
21
|
+
NEURULA_STAGE = "NEURULA_STAGE"
|
|
22
|
+
ORGANOGENESIS_STAGE = "ORGANOGENESIS_STAGE"
|
|
23
|
+
FETAL_STAGE = "FETAL_STAGE"
|
|
24
|
+
NEONATAL_STAGE = "NEONATAL_STAGE"
|
|
25
|
+
INFANT_STAGE = "INFANT_STAGE"
|
|
26
|
+
TODDLER_STAGE = "TODDLER_STAGE"
|
|
27
|
+
CHILD_STAGE = "CHILD_STAGE"
|
|
28
|
+
ADOLESCENT_STAGE = "ADOLESCENT_STAGE"
|
|
29
|
+
ADULT_STAGE = "ADULT_STAGE"
|
|
30
|
+
AGED_STAGE = "AGED_STAGE"
|
|
31
|
+
EMBRYONIC_STAGE = "EMBRYONIC_STAGE"
|
|
32
|
+
PRENATAL_STAGE = "PRENATAL_STAGE"
|
|
33
|
+
POSTNATAL_STAGE = "POSTNATAL_STAGE"
|
|
34
|
+
|
|
35
|
+
# Set metadata after class creation
|
|
36
|
+
HumanDevelopmentalStage._metadata = {
|
|
37
|
+
"ZYGOTE_STAGE": {'description': 'Embryonic stage defined by a fertilized oocyte and presence of pronuclei. Starts at day 1 post-fertilization.', 'meaning': 'HsapDv:0000003'},
|
|
38
|
+
"CLEAVAGE_STAGE": {'description': 'Embryonic stage during which cell division occurs with reduction in cytoplasmic volume, and formation of inner and outer cell mass. 2-8 cells. Usually starts between day 2-3 post-fertilization.', 'meaning': 'HsapDv:0000005'},
|
|
39
|
+
"MORULA_STAGE": {'description': 'The later part of Carnegie stage 02 when the cells have coalesced into a mass but the blastocystic cavity has not formed.', 'meaning': 'HsapDv:0000205'},
|
|
40
|
+
"BLASTOCYST_STAGE": {'description': 'Blastula stage with the loss of the zona pellucida and the definition of a free blastocyst. Usually starts between day 4-5 post-fertilization.', 'meaning': 'HsapDv:0000007'},
|
|
41
|
+
"GASTRULA_STAGE": {'description': 'Embryonic stage defined by a complex and coordinated series of cellular movements that occurs at the end of cleavage.', 'meaning': 'HsapDv:0000010'},
|
|
42
|
+
"NEURULA_STAGE": {'description': 'Embryonic stage defined by the formation of a tube from the flat layer of ectodermal cells known as the neural plate. This stage starts the emergence of the central nervous system.', 'meaning': 'HsapDv:0000012'},
|
|
43
|
+
"ORGANOGENESIS_STAGE": {'description': 'Embryonic stage at which the ectoderm, endoderm, and mesoderm develop into the internal organs of the organism.', 'meaning': 'HsapDv:0000015'},
|
|
44
|
+
"FETAL_STAGE": {'description': 'Prenatal stage that starts with the fully formed embryo and ends at birth. Generally from 8 weeks post-fertilization until birth.', 'meaning': 'HsapDv:0000037'},
|
|
45
|
+
"NEONATAL_STAGE": {'description': 'Immature stage that refers to a human newborn within the first 28 days of life.', 'meaning': 'HsapDv:0000262'},
|
|
46
|
+
"INFANT_STAGE": {'description': 'Immature stage that refers to an infant who is over 28 days and is under 12 months old.', 'meaning': 'HsapDv:0000261'},
|
|
47
|
+
"TODDLER_STAGE": {'description': 'Human stage that refers to a child who is over 12 months and under 5 years old. Often divided into early toddler (1-2 years) and late toddler (2-3 years).', 'meaning': 'HsapDv:0000265'},
|
|
48
|
+
"CHILD_STAGE": {'description': 'Pediatric stage that refers to a human who is over 5 and under 15 years old. Covers elementary and middle school ages.', 'meaning': 'HsapDv:0000271'},
|
|
49
|
+
"ADOLESCENT_STAGE": {'description': 'A young adult stage that refers to an individual who is over 15 and under 20 years old. Period of transition from childhood to adulthood.', 'meaning': 'HsapDv:0000268'},
|
|
50
|
+
"ADULT_STAGE": {'description': 'Human developmental stage that refers to a sexually mature human. Starts at approximately 15 years according to HPO definitions.', 'meaning': 'HsapDv:0000258'},
|
|
51
|
+
"AGED_STAGE": {'description': 'Late adult stage that refers to an individual who is over 60 and starts to have some age-related impairments. Often subdivided into young-old (60-79) and old-old (80+).', 'meaning': 'HsapDv:0000227'},
|
|
52
|
+
"EMBRYONIC_STAGE": {'description': 'Prenatal stage that starts with fertilization and ends with a fully formed embryo, before undergoing last development during the fetal stage. Up to 8 weeks post-fertilization.', 'meaning': 'HsapDv:0000002'},
|
|
53
|
+
"PRENATAL_STAGE": {'description': 'Prenatal stage that starts with fertilization and ends at birth. Encompasses both embryonic and fetal stages.', 'meaning': 'HsapDv:0000045'},
|
|
54
|
+
"POSTNATAL_STAGE": {'description': 'Human developmental stage that covers the whole of human life post birth.', 'meaning': 'HsapDv:0010000'},
|
|
55
|
+
}
|
|
56
|
+
|
|
57
|
+
class MouseDevelopmentalStage(RichEnum):
|
|
58
|
+
# Enum members
|
|
59
|
+
ZYGOTE_STAGE = "ZYGOTE_STAGE"
|
|
60
|
+
TWO_CELL_STAGE = "TWO_CELL_STAGE"
|
|
61
|
+
FOUR_CELL_STAGE = "FOUR_CELL_STAGE"
|
|
62
|
+
EIGHT_CELL_STAGE = "EIGHT_CELL_STAGE"
|
|
63
|
+
MORULA_STAGE = "MORULA_STAGE"
|
|
64
|
+
BLASTOCYST_STAGE = "BLASTOCYST_STAGE"
|
|
65
|
+
GASTRULA_STAGE = "GASTRULA_STAGE"
|
|
66
|
+
NEURULA_STAGE = "NEURULA_STAGE"
|
|
67
|
+
ORGANOGENESIS_STAGE = "ORGANOGENESIS_STAGE"
|
|
68
|
+
E0_5 = "E0_5"
|
|
69
|
+
E9_5 = "E9_5"
|
|
70
|
+
E14_5 = "E14_5"
|
|
71
|
+
P0_NEWBORN = "P0_NEWBORN"
|
|
72
|
+
P21_WEANING = "P21_WEANING"
|
|
73
|
+
P42_JUVENILE = "P42_JUVENILE"
|
|
74
|
+
P56_ADULT = "P56_ADULT"
|
|
75
|
+
AGED_12_MONTHS = "AGED_12_MONTHS"
|
|
76
|
+
THEILER_STAGE = "THEILER_STAGE"
|
|
77
|
+
|
|
78
|
+
# Set metadata after class creation
|
|
79
|
+
MouseDevelopmentalStage._metadata = {
|
|
80
|
+
"ZYGOTE_STAGE": {'description': 'Embryonic stage defined by a one-cell embryo (fertilised egg) with zona pellucida present. Embryonic age 0-0.9 dpc (days post coitum).', 'meaning': 'MmusDv:0000003'},
|
|
81
|
+
"TWO_CELL_STAGE": {'description': 'Embryonic cleavage stage defined by a dividing 2-4 cells egg. Embryonic age 1 dpc.', 'meaning': 'MmusDv:0000005'},
|
|
82
|
+
"FOUR_CELL_STAGE": {'description': 'Part of Theiler stage 02 - dividing egg with 4 cells. Embryonic age approximately 1 dpc.', 'meaning': 'MmusDv:0000005'},
|
|
83
|
+
"EIGHT_CELL_STAGE": {'description': 'Part of early morula stage - dividing egg with 8 cells. Embryonic age approximately 2 dpc.', 'meaning': 'MmusDv:0000006'},
|
|
84
|
+
"MORULA_STAGE": {'description': 'Embryonic cleavage stage defined by a dividing 4-16 cells egg, early to fully compacted morula. Embryonic age 2 dpc.', 'meaning': 'MmusDv:0000006'},
|
|
85
|
+
"BLASTOCYST_STAGE": {'description': 'Embryonic blastula stage defined by a zona free blastocyst (zona pellucida absent). Embryonic age 4 dpc.', 'meaning': 'MmusDv:0000009'},
|
|
86
|
+
"GASTRULA_STAGE": {'description': 'Embryonic stage defined by complex and coordinated series of cellular movements that occurs at the end of cleavage.', 'meaning': 'MmusDv:0000013'},
|
|
87
|
+
"NEURULA_STAGE": {'description': 'Embryonic stage called presomite stage and defined by the formation of the neural plate. This stage starts the emergence of the central nervous system at embryonic age 7.5 dpc.', 'meaning': 'MmusDv:0000017'},
|
|
88
|
+
"ORGANOGENESIS_STAGE": {'description': 'Embryonic stage at which the ectoderm, endoderm, and mesoderm develop into the internal organs of the organism.', 'meaning': 'MmusDv:0000018'},
|
|
89
|
+
"E0_5": {'description': 'Embryonic day 0.5 - one-cell embryo stage. Corresponds to Theiler stage 01.', 'meaning': 'MmusDv:0000003'},
|
|
90
|
+
"E9_5": {'description': 'Embryonic day 9.5 - organogenesis stage with visible hind limb buds. Between Theiler stages 15 and 16.', 'meaning': 'MmusDv:0000023'},
|
|
91
|
+
"E14_5": {'description': 'Embryonic day 14.5 - late organogenesis with clearly visible fingers and long bones of the limbs present.', 'meaning': 'MmusDv:0000029'},
|
|
92
|
+
"P0_NEWBORN": {'description': 'Stage that refers to the newborn mouse, aged E19-20, P0. Used for postnatal days 0 through 3.', 'meaning': 'MmusDv:0000036'},
|
|
93
|
+
"P21_WEANING": {'description': 'Weaning stage at approximately 21-22 days old. Transition from nursing to independent feeding.', 'meaning': 'MmusDv:0000141'},
|
|
94
|
+
"P42_JUVENILE": {'description': 'Prime adult stage at 6 weeks (42 days) old. Commonly considered the milestone for sexual maturity.', 'meaning': 'MmusDv:0000151'},
|
|
95
|
+
"P56_ADULT": {'description': 'Adult stage at 8 weeks (56 days) old. Fully mature adult mouse.', 'meaning': 'MmusDv:0000154'},
|
|
96
|
+
"AGED_12_MONTHS": {'description': 'Middle aged stage for mice over 10 and under 18 months old. Shows progressive age-related changes.', 'meaning': 'MmusDv:0000135'},
|
|
97
|
+
"THEILER_STAGE": {'description': 'Reference to any Theiler stage (TS1-TS28) which provides standardized morphological staging for mouse development.'},
|
|
98
|
+
}
|
|
99
|
+
|
|
100
|
+
__all__ = [
|
|
101
|
+
"HumanDevelopmentalStage",
|
|
102
|
+
"MouseDevelopmentalStage",
|
|
103
|
+
]
|
|
@@ -0,0 +1,182 @@
|
|
|
1
|
+
"""
|
|
2
|
+
Genome Feature Types
|
|
3
|
+
|
|
4
|
+
Genome feature types from SOFA (Sequence Ontology Feature Annotation),
|
|
5
|
+
the subset of SO used in GFF3 files for genome annotation.
|
|
6
|
+
Organized hierarchically following the Sequence Ontology structure.
|
|
7
|
+
|
|
8
|
+
Generated from: bio/genome_features.yaml
|
|
9
|
+
"""
|
|
10
|
+
|
|
11
|
+
from __future__ import annotations
|
|
12
|
+
|
|
13
|
+
from typing import Dict, Any, Optional
|
|
14
|
+
from valuesets.generators.rich_enum import RichEnum
|
|
15
|
+
|
|
16
|
+
class GenomeFeatureType(RichEnum):
|
|
17
|
+
"""
|
|
18
|
+
Genome feature types from SOFA (Sequence Ontology Feature Annotation).
|
|
19
|
+
This is the subset of Sequence Ontology terms used in GFF3 files.
|
|
20
|
+
Organized hierarchically following the Sequence Ontology structure.
|
|
21
|
+
"""
|
|
22
|
+
# Enum members
|
|
23
|
+
REGION = "REGION"
|
|
24
|
+
BIOLOGICAL_REGION = "BIOLOGICAL_REGION"
|
|
25
|
+
GENE = "GENE"
|
|
26
|
+
TRANSCRIPT = "TRANSCRIPT"
|
|
27
|
+
PRIMARY_TRANSCRIPT = "PRIMARY_TRANSCRIPT"
|
|
28
|
+
MRNA = "MRNA"
|
|
29
|
+
EXON = "EXON"
|
|
30
|
+
CDS = "CDS"
|
|
31
|
+
INTRON = "INTRON"
|
|
32
|
+
FIVE_PRIME_UTR = "FIVE_PRIME_UTR"
|
|
33
|
+
THREE_PRIME_UTR = "THREE_PRIME_UTR"
|
|
34
|
+
NCRNA = "NCRNA"
|
|
35
|
+
RRNA = "RRNA"
|
|
36
|
+
TRNA = "TRNA"
|
|
37
|
+
SNRNA = "SNRNA"
|
|
38
|
+
SNORNA = "SNORNA"
|
|
39
|
+
MIRNA = "MIRNA"
|
|
40
|
+
LNCRNA = "LNCRNA"
|
|
41
|
+
RIBOZYME = "RIBOZYME"
|
|
42
|
+
ANTISENSE_RNA = "ANTISENSE_RNA"
|
|
43
|
+
PSEUDOGENE = "PSEUDOGENE"
|
|
44
|
+
PROCESSED_PSEUDOGENE = "PROCESSED_PSEUDOGENE"
|
|
45
|
+
REGULATORY_REGION = "REGULATORY_REGION"
|
|
46
|
+
PROMOTER = "PROMOTER"
|
|
47
|
+
ENHANCER = "ENHANCER"
|
|
48
|
+
SILENCER = "SILENCER"
|
|
49
|
+
TERMINATOR = "TERMINATOR"
|
|
50
|
+
ATTENUATOR = "ATTENUATOR"
|
|
51
|
+
POLYA_SIGNAL_SEQUENCE = "POLYA_SIGNAL_SEQUENCE"
|
|
52
|
+
BINDING_SITE = "BINDING_SITE"
|
|
53
|
+
TFBS = "TFBS"
|
|
54
|
+
RIBOSOME_ENTRY_SITE = "RIBOSOME_ENTRY_SITE"
|
|
55
|
+
POLYA_SITE = "POLYA_SITE"
|
|
56
|
+
REPEAT_REGION = "REPEAT_REGION"
|
|
57
|
+
DISPERSED_REPEAT = "DISPERSED_REPEAT"
|
|
58
|
+
TANDEM_REPEAT = "TANDEM_REPEAT"
|
|
59
|
+
INVERTED_REPEAT = "INVERTED_REPEAT"
|
|
60
|
+
TRANSPOSABLE_ELEMENT = "TRANSPOSABLE_ELEMENT"
|
|
61
|
+
MOBILE_ELEMENT = "MOBILE_ELEMENT"
|
|
62
|
+
SEQUENCE_ALTERATION = "SEQUENCE_ALTERATION"
|
|
63
|
+
INSERTION = "INSERTION"
|
|
64
|
+
DELETION = "DELETION"
|
|
65
|
+
INVERSION = "INVERSION"
|
|
66
|
+
DUPLICATION = "DUPLICATION"
|
|
67
|
+
SUBSTITUTION = "SUBSTITUTION"
|
|
68
|
+
ORIGIN_OF_REPLICATION = "ORIGIN_OF_REPLICATION"
|
|
69
|
+
POLYC_TRACT = "POLYC_TRACT"
|
|
70
|
+
GAP = "GAP"
|
|
71
|
+
ASSEMBLY_GAP = "ASSEMBLY_GAP"
|
|
72
|
+
CHROMOSOME = "CHROMOSOME"
|
|
73
|
+
SUPERCONTIG = "SUPERCONTIG"
|
|
74
|
+
CONTIG = "CONTIG"
|
|
75
|
+
SCAFFOLD = "SCAFFOLD"
|
|
76
|
+
CLONE = "CLONE"
|
|
77
|
+
PLASMID = "PLASMID"
|
|
78
|
+
POLYPEPTIDE = "POLYPEPTIDE"
|
|
79
|
+
MATURE_PROTEIN_REGION = "MATURE_PROTEIN_REGION"
|
|
80
|
+
SIGNAL_PEPTIDE = "SIGNAL_PEPTIDE"
|
|
81
|
+
TRANSIT_PEPTIDE = "TRANSIT_PEPTIDE"
|
|
82
|
+
PROPEPTIDE = "PROPEPTIDE"
|
|
83
|
+
OPERON = "OPERON"
|
|
84
|
+
STEM_LOOP = "STEM_LOOP"
|
|
85
|
+
D_LOOP = "D_LOOP"
|
|
86
|
+
MATCH = "MATCH"
|
|
87
|
+
CDNA_MATCH = "CDNA_MATCH"
|
|
88
|
+
EST_MATCH = "EST_MATCH"
|
|
89
|
+
PROTEIN_MATCH = "PROTEIN_MATCH"
|
|
90
|
+
NUCLEOTIDE_MATCH = "NUCLEOTIDE_MATCH"
|
|
91
|
+
JUNCTION_FEATURE = "JUNCTION_FEATURE"
|
|
92
|
+
SPLICE_SITE = "SPLICE_SITE"
|
|
93
|
+
FIVE_PRIME_SPLICE_SITE = "FIVE_PRIME_SPLICE_SITE"
|
|
94
|
+
THREE_PRIME_SPLICE_SITE = "THREE_PRIME_SPLICE_SITE"
|
|
95
|
+
START_CODON = "START_CODON"
|
|
96
|
+
STOP_CODON = "STOP_CODON"
|
|
97
|
+
CENTROMERE = "CENTROMERE"
|
|
98
|
+
TELOMERE = "TELOMERE"
|
|
99
|
+
|
|
100
|
+
# Set metadata after class creation
|
|
101
|
+
GenomeFeatureType._metadata = {
|
|
102
|
+
"REGION": {'description': 'A sequence feature with an extent greater than zero', 'meaning': 'SO:0000001'},
|
|
103
|
+
"BIOLOGICAL_REGION": {'description': 'A region defined by its biological properties', 'meaning': 'SO:0001411'},
|
|
104
|
+
"GENE": {'description': 'A region (or regions) that includes all of the sequence elements necessary to encode a functional transcript', 'meaning': 'SO:0000704'},
|
|
105
|
+
"TRANSCRIPT": {'description': 'An RNA synthesized on a DNA or RNA template by an RNA polymerase', 'meaning': 'SO:0000673'},
|
|
106
|
+
"PRIMARY_TRANSCRIPT": {'description': 'A transcript that has not been processed', 'meaning': 'SO:0000185'},
|
|
107
|
+
"MRNA": {'description': "Messenger RNA; includes 5'UTR, coding sequences and 3'UTR", 'meaning': 'SO:0000234'},
|
|
108
|
+
"EXON": {'description': 'A region of the transcript sequence within a gene which is not removed from the primary RNA transcript by RNA splicing', 'meaning': 'SO:0000147'},
|
|
109
|
+
"CDS": {'description': 'Coding sequence; sequence of nucleotides that corresponds with the sequence of amino acids in a protein', 'meaning': 'SO:0000316'},
|
|
110
|
+
"INTRON": {'description': 'A region of a primary transcript that is transcribed, but removed from within the transcript by splicing', 'meaning': 'SO:0000188'},
|
|
111
|
+
"FIVE_PRIME_UTR": {'description': "5' untranslated region", 'meaning': 'SO:0000204'},
|
|
112
|
+
"THREE_PRIME_UTR": {'description': "3' untranslated region", 'meaning': 'SO:0000205'},
|
|
113
|
+
"NCRNA": {'description': 'Non-protein coding RNA', 'meaning': 'SO:0000655'},
|
|
114
|
+
"RRNA": {'description': 'Ribosomal RNA', 'meaning': 'SO:0000252'},
|
|
115
|
+
"TRNA": {'description': 'Transfer RNA', 'meaning': 'SO:0000253'},
|
|
116
|
+
"SNRNA": {'description': 'Small nuclear RNA', 'meaning': 'SO:0000274'},
|
|
117
|
+
"SNORNA": {'description': 'Small nucleolar RNA', 'meaning': 'SO:0000275'},
|
|
118
|
+
"MIRNA": {'description': 'MicroRNA', 'meaning': 'SO:0000276'},
|
|
119
|
+
"LNCRNA": {'description': 'Long non-coding RNA', 'meaning': 'SO:0001877'},
|
|
120
|
+
"RIBOZYME": {'description': 'An RNA with catalytic activity', 'meaning': 'SO:0000374'},
|
|
121
|
+
"ANTISENSE_RNA": {'description': 'RNA that is complementary to other RNA', 'meaning': 'SO:0000644'},
|
|
122
|
+
"PSEUDOGENE": {'description': 'A sequence that closely resembles a known functional gene but does not produce a functional product', 'meaning': 'SO:0000336'},
|
|
123
|
+
"PROCESSED_PSEUDOGENE": {'description': 'A pseudogene arising from reverse transcription of mRNA', 'meaning': 'SO:0000043'},
|
|
124
|
+
"REGULATORY_REGION": {'description': 'A region involved in the control of the process of gene expression', 'meaning': 'SO:0005836'},
|
|
125
|
+
"PROMOTER": {'description': 'A regulatory region initiating transcription', 'meaning': 'SO:0000167'},
|
|
126
|
+
"ENHANCER": {'description': 'A cis-acting sequence that increases transcription', 'meaning': 'SO:0000165'},
|
|
127
|
+
"SILENCER": {'description': 'A regulatory region which upon binding of transcription factors, suppresses transcription', 'meaning': 'SO:0000625'},
|
|
128
|
+
"TERMINATOR": {'description': 'The sequence of DNA located either at the end of the transcript that causes RNA polymerase to terminate transcription', 'meaning': 'SO:0000141'},
|
|
129
|
+
"ATTENUATOR": {'description': 'A sequence that causes transcription termination', 'meaning': 'SO:0000140'},
|
|
130
|
+
"POLYA_SIGNAL_SEQUENCE": {'description': 'The recognition sequence for the cleavage and polyadenylation machinery', 'meaning': 'SO:0000551'},
|
|
131
|
+
"BINDING_SITE": {'description': 'A region on a molecule that binds to another molecule', 'meaning': 'SO:0000409'},
|
|
132
|
+
"TFBS": {'description': 'Transcription factor binding site', 'meaning': 'SO:0000235'},
|
|
133
|
+
"RIBOSOME_ENTRY_SITE": {'description': 'Region where ribosome assembles on mRNA', 'meaning': 'SO:0000139'},
|
|
134
|
+
"POLYA_SITE": {'description': 'Polyadenylation site', 'meaning': 'SO:0000553'},
|
|
135
|
+
"REPEAT_REGION": {'description': 'A region of sequence containing one or more repeat units', 'meaning': 'SO:0000657'},
|
|
136
|
+
"DISPERSED_REPEAT": {'description': 'A repeat that is interspersed in the genome', 'meaning': 'SO:0000658'},
|
|
137
|
+
"TANDEM_REPEAT": {'description': 'A repeat where the same sequence is repeated in the same orientation', 'meaning': 'SO:0000705'},
|
|
138
|
+
"INVERTED_REPEAT": {'description': 'A repeat where the sequence is repeated in the opposite orientation', 'meaning': 'SO:0000294'},
|
|
139
|
+
"TRANSPOSABLE_ELEMENT": {'description': 'A DNA segment that can change its position within the genome', 'meaning': 'SO:0000101'},
|
|
140
|
+
"MOBILE_ELEMENT": {'description': 'A nucleotide region with the ability to move from one place in the genome to another', 'meaning': 'SO:0001037'},
|
|
141
|
+
"SEQUENCE_ALTERATION": {'description': 'A sequence that deviates from the reference sequence', 'meaning': 'SO:0001059'},
|
|
142
|
+
"INSERTION": {'description': 'The sequence of one or more nucleotides added between two adjacent nucleotides', 'meaning': 'SO:0000667'},
|
|
143
|
+
"DELETION": {'description': 'The removal of a sequences of nucleotides from the genome', 'meaning': 'SO:0000159'},
|
|
144
|
+
"INVERSION": {'description': 'A continuous nucleotide sequence is inverted in the same position', 'meaning': 'SO:1000036'},
|
|
145
|
+
"DUPLICATION": {'description': 'One or more nucleotides are added between two adjacent nucleotides', 'meaning': 'SO:1000035'},
|
|
146
|
+
"SUBSTITUTION": {'description': 'A sequence alteration where one nucleotide replaced by another', 'meaning': 'SO:1000002'},
|
|
147
|
+
"ORIGIN_OF_REPLICATION": {'description': 'The origin of replication; starting site for duplication of a nucleic acid molecule', 'meaning': 'SO:0000296'},
|
|
148
|
+
"POLYC_TRACT": {'description': 'A sequence of Cs'},
|
|
149
|
+
"GAP": {'description': 'A gap in the sequence', 'meaning': 'SO:0000730'},
|
|
150
|
+
"ASSEMBLY_GAP": {'description': 'A gap between two sequences in an assembly', 'meaning': 'SO:0000730'},
|
|
151
|
+
"CHROMOSOME": {'description': 'Structural unit composed of DNA and proteins', 'meaning': 'SO:0000340'},
|
|
152
|
+
"SUPERCONTIG": {'description': 'One or more contigs that have been ordered and oriented using end-read information', 'meaning': 'SO:0000148'},
|
|
153
|
+
"CONTIG": {'description': 'A contiguous sequence derived from sequence assembly', 'meaning': 'SO:0000149'},
|
|
154
|
+
"SCAFFOLD": {'description': 'One or more contigs that have been ordered and oriented', 'meaning': 'SO:0000148'},
|
|
155
|
+
"CLONE": {'description': 'A piece of DNA that has been inserted into a vector', 'meaning': 'SO:0000151'},
|
|
156
|
+
"PLASMID": {'description': 'A self-replicating circular DNA molecule', 'meaning': 'SO:0000155'},
|
|
157
|
+
"POLYPEPTIDE": {'description': 'A sequence of amino acids linked by peptide bonds', 'meaning': 'SO:0000104'},
|
|
158
|
+
"MATURE_PROTEIN_REGION": {'description': 'The polypeptide sequence that remains after post-translational processing', 'meaning': 'SO:0000419'},
|
|
159
|
+
"SIGNAL_PEPTIDE": {'description': 'A peptide region that targets a polypeptide to a specific location', 'meaning': 'SO:0000418'},
|
|
160
|
+
"TRANSIT_PEPTIDE": {'description': 'A peptide that directs the transport of a protein to an organelle', 'meaning': 'SO:0000725'},
|
|
161
|
+
"PROPEPTIDE": {'description': 'A peptide region that is cleaved during maturation', 'meaning': 'SO:0001062'},
|
|
162
|
+
"OPERON": {'description': 'A group of contiguous genes transcribed as a single unit', 'meaning': 'SO:0000178'},
|
|
163
|
+
"STEM_LOOP": {'description': 'A double-helical region formed by base-pairing between adjacent sequences', 'meaning': 'SO:0000313'},
|
|
164
|
+
"D_LOOP": {'description': 'Displacement loop; a region where DNA is displaced by an invading strand', 'meaning': 'SO:0000297'},
|
|
165
|
+
"MATCH": {'description': 'A region of sequence similarity', 'meaning': 'SO:0000343'},
|
|
166
|
+
"CDNA_MATCH": {'description': 'A match to a cDNA sequence', 'meaning': 'SO:0000689'},
|
|
167
|
+
"EST_MATCH": {'description': 'A match to an EST sequence', 'meaning': 'SO:0000668'},
|
|
168
|
+
"PROTEIN_MATCH": {'description': 'A match to a protein sequence', 'meaning': 'SO:0000349'},
|
|
169
|
+
"NUCLEOTIDE_MATCH": {'description': 'A match to a nucleotide sequence', 'meaning': 'SO:0000347'},
|
|
170
|
+
"JUNCTION_FEATURE": {'description': 'A boundary or junction between sequence regions', 'meaning': 'SO:0000699'},
|
|
171
|
+
"SPLICE_SITE": {'description': 'The position where intron is excised', 'meaning': 'SO:0000162'},
|
|
172
|
+
"FIVE_PRIME_SPLICE_SITE": {'description': "The 5' splice site (donor site)", 'meaning': 'SO:0000163'},
|
|
173
|
+
"THREE_PRIME_SPLICE_SITE": {'description': "The 3' splice site (acceptor site)", 'meaning': 'SO:0000164'},
|
|
174
|
+
"START_CODON": {'description': 'The first codon to be translated', 'meaning': 'SO:0000318'},
|
|
175
|
+
"STOP_CODON": {'description': 'The codon that terminates translation', 'meaning': 'SO:0000319'},
|
|
176
|
+
"CENTROMERE": {'description': 'A region where chromatids are held together', 'meaning': 'SO:0000577'},
|
|
177
|
+
"TELOMERE": {'description': 'The terminal region of a linear chromosome', 'meaning': 'SO:0000624'},
|
|
178
|
+
}
|
|
179
|
+
|
|
180
|
+
__all__ = [
|
|
181
|
+
"GenomeFeatureType",
|
|
182
|
+
]
|
|
@@ -0,0 +1,91 @@
|
|
|
1
|
+
"""
|
|
2
|
+
Genomics Value Sets
|
|
3
|
+
|
|
4
|
+
Value sets related to genomics and sequencing
|
|
5
|
+
|
|
6
|
+
Generated from: bio/genomics.yaml
|
|
7
|
+
"""
|
|
8
|
+
|
|
9
|
+
from __future__ import annotations
|
|
10
|
+
|
|
11
|
+
from typing import Dict, Any, Optional
|
|
12
|
+
from valuesets.generators.rich_enum import RichEnum
|
|
13
|
+
|
|
14
|
+
class CdsPhaseType(RichEnum):
|
|
15
|
+
"""
|
|
16
|
+
For features of type CDS (coding sequence), the phase indicates where the feature begins with reference to the reading frame. The phase is one of the integers 0, 1, or 2, indicating the number of bases that should be removed from the beginning of this feature to reach the first base of the next codon.
|
|
17
|
+
"""
|
|
18
|
+
# Enum members
|
|
19
|
+
PHASE_0 = "PHASE_0"
|
|
20
|
+
PHASE_1 = "PHASE_1"
|
|
21
|
+
PHASE_2 = "PHASE_2"
|
|
22
|
+
|
|
23
|
+
# Set metadata after class creation
|
|
24
|
+
CdsPhaseType._metadata = {
|
|
25
|
+
"PHASE_0": {'description': 'Zero bases from reading frame to feature start.'},
|
|
26
|
+
"PHASE_1": {'description': 'One base from reading frame to feature start.'},
|
|
27
|
+
"PHASE_2": {'description': 'Two bases from reading frame to feature start.'},
|
|
28
|
+
}
|
|
29
|
+
|
|
30
|
+
class ContigCollectionType(RichEnum):
|
|
31
|
+
"""
|
|
32
|
+
The type of the contig set; the type of the 'omics data set. Terms are taken from the Genomics Standards Consortium where possible. See the GSC checklists at https://genomicsstandardsconsortium.github.io/mixs/ for the controlled vocabularies used.
|
|
33
|
+
"""
|
|
34
|
+
# Enum members
|
|
35
|
+
ISOLATE = "ISOLATE"
|
|
36
|
+
MAG = "MAG"
|
|
37
|
+
METAGENOME = "METAGENOME"
|
|
38
|
+
METATRANSCRIPTOME = "METATRANSCRIPTOME"
|
|
39
|
+
SAG = "SAG"
|
|
40
|
+
VIRUS = "VIRUS"
|
|
41
|
+
MARKER = "MARKER"
|
|
42
|
+
|
|
43
|
+
# Set metadata after class creation
|
|
44
|
+
ContigCollectionType._metadata = {
|
|
45
|
+
"ISOLATE": {'description': 'Sequences assembled from DNA of isolated organism. Bacteria/Archaea: https://genomicsstandardsconsortium.github.io/mixs/0010003/ Euk: https://genomicsstandardsconsortium.github.io/mixs/0010002/ Virus: https://genomicsstandardsconsortium.github.io/mixs/0010005/ Organelle: https://genomicsstandardsconsortium.github.io/mixs/0010006/ Plasmid: https://genomicsstandardsconsortium.github.io/mixs/0010004/'},
|
|
46
|
+
"MAG": {'description': 'Sequences assembled from DNA of mixed community and binned. MAGs are likely to represent a single taxonomic origin. See checkm2 scores for quality assessment.', 'meaning': 'mixs:0010011', 'aliases': ['Mimag']},
|
|
47
|
+
"METAGENOME": {'description': 'Sequences assembled from DNA of mixed community.', 'meaning': 'mixs:0010007', 'aliases': ['Mims']},
|
|
48
|
+
"METATRANSCRIPTOME": {'description': 'Sequences assembled from RNA of mixed community. Currently not represented by GSC.'},
|
|
49
|
+
"SAG": {'description': 'Sequences assembled from DNA of single cell.', 'meaning': 'mixs:0010010', 'aliases': ['Misag']},
|
|
50
|
+
"VIRUS": {'description': 'Sequences assembled from uncultivated virus genome (DNA/RNA).', 'meaning': 'mixs:0010012', 'aliases': ['Miuvig']},
|
|
51
|
+
"MARKER": {'description': 'Sequences from targeted region of DNA; see protocol for information on targeted region. specimen: https://genomicsstandardsconsortium.github.io/mixs/0010009/ survey: https://genomicsstandardsconsortium.github.io/mixs/0010008/'},
|
|
52
|
+
}
|
|
53
|
+
|
|
54
|
+
class StrandType(RichEnum):
|
|
55
|
+
"""
|
|
56
|
+
The strand that a feature appears on relative to a landmark. Also encompasses unknown or irrelevant strandedness.
|
|
57
|
+
"""
|
|
58
|
+
# Enum members
|
|
59
|
+
NEGATIVE = "NEGATIVE"
|
|
60
|
+
POSITIVE = "POSITIVE"
|
|
61
|
+
UNKNOWN = "UNKNOWN"
|
|
62
|
+
UNSTRANDED = "UNSTRANDED"
|
|
63
|
+
|
|
64
|
+
# Set metadata after class creation
|
|
65
|
+
StrandType._metadata = {
|
|
66
|
+
"NEGATIVE": {'description': 'Represented by "-" in a GFF file; the strand is negative wrt the landmark.'},
|
|
67
|
+
"POSITIVE": {'description': 'Represented by "+" in a GFF file; the strand is positive with relation to the landmark.'},
|
|
68
|
+
"UNKNOWN": {'description': 'Represented by "?" in a GFF file. The strandedness is relevant but unknown.'},
|
|
69
|
+
"UNSTRANDED": {'description': 'Represented by "." in a GFF file; the feature is not stranded.'},
|
|
70
|
+
}
|
|
71
|
+
|
|
72
|
+
class SequenceType(RichEnum):
|
|
73
|
+
"""
|
|
74
|
+
The type of sequence being represented.
|
|
75
|
+
"""
|
|
76
|
+
# Enum members
|
|
77
|
+
NUCLEIC_ACID = "NUCLEIC_ACID"
|
|
78
|
+
AMINO_ACID = "AMINO_ACID"
|
|
79
|
+
|
|
80
|
+
# Set metadata after class creation
|
|
81
|
+
SequenceType._metadata = {
|
|
82
|
+
"NUCLEIC_ACID": {'description': 'A nucleic acid sequence, as found in an FNA file.'},
|
|
83
|
+
"AMINO_ACID": {'description': 'An amino acid sequence, as would be found in an FAA file.'},
|
|
84
|
+
}
|
|
85
|
+
|
|
86
|
+
__all__ = [
|
|
87
|
+
"CdsPhaseType",
|
|
88
|
+
"ContigCollectionType",
|
|
89
|
+
"StrandType",
|
|
90
|
+
"SequenceType",
|
|
91
|
+
]
|
|
@@ -0,0 +1,32 @@
|
|
|
1
|
+
"""
|
|
2
|
+
Gene Ontology Aspects
|
|
3
|
+
|
|
4
|
+
The three main aspects of Gene Ontology - Molecular Function, Biological Process, and Cellular Component
|
|
5
|
+
|
|
6
|
+
Generated from: bio/go_aspect.yaml
|
|
7
|
+
"""
|
|
8
|
+
|
|
9
|
+
from __future__ import annotations
|
|
10
|
+
|
|
11
|
+
from typing import Dict, Any, Optional
|
|
12
|
+
from valuesets.generators.rich_enum import RichEnum
|
|
13
|
+
|
|
14
|
+
class GOAspect(RichEnum):
|
|
15
|
+
"""
|
|
16
|
+
The three main aspects (namespaces) of Gene Ontology
|
|
17
|
+
"""
|
|
18
|
+
# Enum members
|
|
19
|
+
F = "F"
|
|
20
|
+
P = "P"
|
|
21
|
+
C = "C"
|
|
22
|
+
|
|
23
|
+
# Set metadata after class creation
|
|
24
|
+
GOAspect._metadata = {
|
|
25
|
+
"F": {'description': 'The activities that occur at the molecular level, such as catalysis or binding', 'meaning': 'GO:0003674', 'aliases': ['molecular_function', 'MF']},
|
|
26
|
+
"P": {'description': 'The larger processes accomplished by multiple molecular activities', 'meaning': 'GO:0008150', 'aliases': ['biological_process', 'BP']},
|
|
27
|
+
"C": {'description': 'The locations relative to cellular structures in which a gene product performs a function', 'meaning': 'GO:0005575', 'aliases': ['cellular_component', 'CC']},
|
|
28
|
+
}
|
|
29
|
+
|
|
30
|
+
__all__ = [
|
|
31
|
+
"GOAspect",
|
|
32
|
+
]
|
|
@@ -0,0 +1,58 @@
|
|
|
1
|
+
"""
|
|
2
|
+
Gene Ontology Causality Value Sets
|
|
3
|
+
|
|
4
|
+
Value sets for GO causal relationships and predicates used in gene ontology annotations and pathway analysis
|
|
5
|
+
|
|
6
|
+
Generated from: bio/go_causality.yaml
|
|
7
|
+
"""
|
|
8
|
+
|
|
9
|
+
from __future__ import annotations
|
|
10
|
+
|
|
11
|
+
from typing import Dict, Any, Optional
|
|
12
|
+
from valuesets.generators.rich_enum import RichEnum
|
|
13
|
+
|
|
14
|
+
class CausalPredicateEnum(RichEnum):
|
|
15
|
+
"""
|
|
16
|
+
A term describing the causal relationship between two activities. All terms are drawn from the "causally upstream or within" (RO:0002418) branch of the Relation Ontology (RO).
|
|
17
|
+
"""
|
|
18
|
+
# Enum members
|
|
19
|
+
CONSTITUTIVELY_UPSTREAM_OF = "CONSTITUTIVELY_UPSTREAM_OF"
|
|
20
|
+
PROVIDES_INPUT_FOR = "PROVIDES_INPUT_FOR"
|
|
21
|
+
REMOVES_INPUT_FOR = "REMOVES_INPUT_FOR"
|
|
22
|
+
CAUSALLY_UPSTREAM_OF = "CAUSALLY_UPSTREAM_OF"
|
|
23
|
+
CAUSALLY_UPSTREAM_OF_POSITIVE_EFFECT = "CAUSALLY_UPSTREAM_OF_POSITIVE_EFFECT"
|
|
24
|
+
CAUSALLY_UPSTREAM_OF_NEGATIVE_EFFECT = "CAUSALLY_UPSTREAM_OF_NEGATIVE_EFFECT"
|
|
25
|
+
REGULATES = "REGULATES"
|
|
26
|
+
NEGATIVELY_REGULATES = "NEGATIVELY_REGULATES"
|
|
27
|
+
POSITIVELY_REGULATES = "POSITIVELY_REGULATES"
|
|
28
|
+
DIRECTLY_NEGATIVELY_REGULATES = "DIRECTLY_NEGATIVELY_REGULATES"
|
|
29
|
+
INDIRECTLY_NEGATIVELY_REGULATES = "INDIRECTLY_NEGATIVELY_REGULATES"
|
|
30
|
+
DIRECTLY_POSITIVELY_REGULATES = "DIRECTLY_POSITIVELY_REGULATES"
|
|
31
|
+
INDIRECTLY_POSITIVELY_REGULATES = "INDIRECTLY_POSITIVELY_REGULATES"
|
|
32
|
+
IS_SMALL_MOLECULE_REGULATOR_OF = "IS_SMALL_MOLECULE_REGULATOR_OF"
|
|
33
|
+
IS_SMALL_MOLECULE_ACTIVATOR_OF = "IS_SMALL_MOLECULE_ACTIVATOR_OF"
|
|
34
|
+
IS_SMALL_MOLECULE_INHIBITOR_OF = "IS_SMALL_MOLECULE_INHIBITOR_OF"
|
|
35
|
+
|
|
36
|
+
# Set metadata after class creation
|
|
37
|
+
CausalPredicateEnum._metadata = {
|
|
38
|
+
"CONSTITUTIVELY_UPSTREAM_OF": {'meaning': 'RO:0012009'},
|
|
39
|
+
"PROVIDES_INPUT_FOR": {'meaning': 'RO:0002413'},
|
|
40
|
+
"REMOVES_INPUT_FOR": {'meaning': 'RO:0012010'},
|
|
41
|
+
"CAUSALLY_UPSTREAM_OF": {'meaning': 'RO:0002411', 'aliases': ['undetermined']},
|
|
42
|
+
"CAUSALLY_UPSTREAM_OF_POSITIVE_EFFECT": {'meaning': 'RO:0002304', 'annotations': {'symbol': '+', 'direction': 'POSITIVE'}},
|
|
43
|
+
"CAUSALLY_UPSTREAM_OF_NEGATIVE_EFFECT": {'meaning': 'RO:0002305', 'annotations': {'symbol': '-', 'direction': 'NEGATIVE'}},
|
|
44
|
+
"REGULATES": {'meaning': 'RO:0002211', 'annotations': {'symbol': 'R'}},
|
|
45
|
+
"NEGATIVELY_REGULATES": {'meaning': 'RO:0002212', 'annotations': {'symbol': '-R', 'direction': 'NEGATIVE'}},
|
|
46
|
+
"POSITIVELY_REGULATES": {'meaning': 'RO:0002213', 'annotations': {'symbol': '+R', 'direction': 'POSITIVE'}},
|
|
47
|
+
"DIRECTLY_NEGATIVELY_REGULATES": {'meaning': 'RO:0002630', 'annotations': {'directness': 'DIRECT', 'direction': 'NEGATIVE'}},
|
|
48
|
+
"INDIRECTLY_NEGATIVELY_REGULATES": {'meaning': 'RO:0002409', 'annotations': {'directness': 'INDIRECT', 'direction': 'NEGATIVE'}},
|
|
49
|
+
"DIRECTLY_POSITIVELY_REGULATES": {'meaning': 'RO:0002629', 'annotations': {'directness': 'DIRECT', 'direction': 'POSITIVE'}},
|
|
50
|
+
"INDIRECTLY_POSITIVELY_REGULATES": {'meaning': 'RO:0002407', 'annotations': {'directness': 'INDIRECT', 'direction': 'POSITIVE'}},
|
|
51
|
+
"IS_SMALL_MOLECULE_REGULATOR_OF": {'meaning': 'RO:0012004'},
|
|
52
|
+
"IS_SMALL_MOLECULE_ACTIVATOR_OF": {'meaning': 'RO:0012005', 'annotations': {'direction': 'POSITIVE'}},
|
|
53
|
+
"IS_SMALL_MOLECULE_INHIBITOR_OF": {'meaning': 'RO:0012006', 'annotations': {'direction': 'NEGATIVE'}},
|
|
54
|
+
}
|
|
55
|
+
|
|
56
|
+
__all__ = [
|
|
57
|
+
"CausalPredicateEnum",
|
|
58
|
+
]
|