valuesets 0.3.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of valuesets might be problematic. Click here for more details.

Files changed (248) hide show
  1. valuesets/__init__.py +7 -0
  2. valuesets/_version.py +8 -0
  3. valuesets/datamodel/valuesets.py +13796 -0
  4. valuesets/datamodel/valuesets_dataclass.py +24503 -0
  5. valuesets/datamodel/valuesets_pydantic.py +13796 -0
  6. valuesets/enums/__init__.py +590 -0
  7. valuesets/enums/academic/__init__.py +1 -0
  8. valuesets/enums/academic/research.py +559 -0
  9. valuesets/enums/analytical_chemistry/__init__.py +1 -0
  10. valuesets/enums/analytical_chemistry/mass_spectrometry.py +198 -0
  11. valuesets/enums/bio/__init__.py +1 -0
  12. valuesets/enums/bio/biological_colors.py +238 -0
  13. valuesets/enums/bio/cell_cycle.py +180 -0
  14. valuesets/enums/bio/currency_chemicals.py +52 -0
  15. valuesets/enums/bio/developmental_stages.py +103 -0
  16. valuesets/enums/bio/genome_features.py +182 -0
  17. valuesets/enums/bio/genomics.py +91 -0
  18. valuesets/enums/bio/go_aspect.py +32 -0
  19. valuesets/enums/bio/go_causality.py +58 -0
  20. valuesets/enums/bio/go_evidence.py +129 -0
  21. valuesets/enums/bio/human_developmental_stages.py +62 -0
  22. valuesets/enums/bio/insdc_geographic_locations.py +591 -0
  23. valuesets/enums/bio/insdc_missing_values.py +49 -0
  24. valuesets/enums/bio/lipid_categories.py +67 -0
  25. valuesets/enums/bio/mouse_developmental_stages.py +62 -0
  26. valuesets/enums/bio/plant_biology.py +86 -0
  27. valuesets/enums/bio/plant_developmental_stages.py +54 -0
  28. valuesets/enums/bio/plant_sex.py +81 -0
  29. valuesets/enums/bio/protein_evidence.py +61 -0
  30. valuesets/enums/bio/proteomics_standards.py +123 -0
  31. valuesets/enums/bio/psi_mi.py +306 -0
  32. valuesets/enums/bio/relationship_to_oxygen.py +37 -0
  33. valuesets/enums/bio/sequence_alphabets.py +449 -0
  34. valuesets/enums/bio/sequence_chemistry.py +357 -0
  35. valuesets/enums/bio/sequencing_platforms.py +302 -0
  36. valuesets/enums/bio/structural_biology.py +320 -0
  37. valuesets/enums/bio/taxonomy.py +238 -0
  38. valuesets/enums/bio/trophic_levels.py +85 -0
  39. valuesets/enums/bio/uniprot_species.py +344 -0
  40. valuesets/enums/bio/viral_genome_types.py +47 -0
  41. valuesets/enums/bioprocessing/__init__.py +1 -0
  42. valuesets/enums/bioprocessing/scale_up.py +249 -0
  43. valuesets/enums/business/__init__.py +1 -0
  44. valuesets/enums/business/human_resources.py +275 -0
  45. valuesets/enums/business/industry_classifications.py +181 -0
  46. valuesets/enums/business/management_operations.py +228 -0
  47. valuesets/enums/business/organizational_structures.py +236 -0
  48. valuesets/enums/business/quality_management.py +181 -0
  49. valuesets/enums/business/supply_chain.py +232 -0
  50. valuesets/enums/chemistry/__init__.py +1 -0
  51. valuesets/enums/chemistry/chemical_entities.py +315 -0
  52. valuesets/enums/chemistry/reaction_directionality.py +65 -0
  53. valuesets/enums/chemistry/reactions.py +256 -0
  54. valuesets/enums/clinical/__init__.py +1 -0
  55. valuesets/enums/clinical/nih_demographics.py +177 -0
  56. valuesets/enums/clinical/phenopackets.py +254 -0
  57. valuesets/enums/common_value_sets.py +8791 -0
  58. valuesets/enums/computing/__init__.py +1 -0
  59. valuesets/enums/computing/file_formats.py +294 -0
  60. valuesets/enums/computing/maturity_levels.py +196 -0
  61. valuesets/enums/computing/mime_types.py +227 -0
  62. valuesets/enums/confidence_levels.py +168 -0
  63. valuesets/enums/contributor.py +30 -0
  64. valuesets/enums/core.py +42 -0
  65. valuesets/enums/data/__init__.py +1 -0
  66. valuesets/enums/data/data_absent_reason.py +53 -0
  67. valuesets/enums/data_science/__init__.py +1 -0
  68. valuesets/enums/data_science/binary_classification.py +87 -0
  69. valuesets/enums/data_science/emotion_classification.py +66 -0
  70. valuesets/enums/data_science/priority_severity.py +73 -0
  71. valuesets/enums/data_science/quality_control.py +46 -0
  72. valuesets/enums/data_science/sentiment_analysis.py +50 -0
  73. valuesets/enums/data_science/text_classification.py +97 -0
  74. valuesets/enums/demographics.py +206 -0
  75. valuesets/enums/ecological_interactions.py +151 -0
  76. valuesets/enums/energy/__init__.py +1 -0
  77. valuesets/enums/energy/energy.py +343 -0
  78. valuesets/enums/energy/fossil_fuels.py +29 -0
  79. valuesets/enums/energy/nuclear/__init__.py +1 -0
  80. valuesets/enums/energy/nuclear/nuclear_facilities.py +195 -0
  81. valuesets/enums/energy/nuclear/nuclear_fuel_cycle.py +96 -0
  82. valuesets/enums/energy/nuclear/nuclear_fuels.py +175 -0
  83. valuesets/enums/energy/nuclear/nuclear_operations.py +191 -0
  84. valuesets/enums/energy/nuclear/nuclear_regulatory.py +188 -0
  85. valuesets/enums/energy/nuclear/nuclear_safety.py +164 -0
  86. valuesets/enums/energy/nuclear/nuclear_waste.py +158 -0
  87. valuesets/enums/energy/nuclear/reactor_types.py +163 -0
  88. valuesets/enums/environmental_health/__init__.py +1 -0
  89. valuesets/enums/environmental_health/exposures.py +265 -0
  90. valuesets/enums/geography/__init__.py +1 -0
  91. valuesets/enums/geography/geographic_codes.py +741 -0
  92. valuesets/enums/health/__init__.py +12 -0
  93. valuesets/enums/health/vaccination.py +98 -0
  94. valuesets/enums/health.py +36 -0
  95. valuesets/enums/health_base.py +36 -0
  96. valuesets/enums/healthcare.py +45 -0
  97. valuesets/enums/industry/__init__.py +1 -0
  98. valuesets/enums/industry/extractive_industry.py +94 -0
  99. valuesets/enums/industry/mining.py +388 -0
  100. valuesets/enums/industry/safety_colors.py +201 -0
  101. valuesets/enums/investigation.py +27 -0
  102. valuesets/enums/materials_science/__init__.py +1 -0
  103. valuesets/enums/materials_science/characterization_methods.py +112 -0
  104. valuesets/enums/materials_science/crystal_structures.py +76 -0
  105. valuesets/enums/materials_science/material_properties.py +119 -0
  106. valuesets/enums/materials_science/material_types.py +104 -0
  107. valuesets/enums/materials_science/pigments_dyes.py +198 -0
  108. valuesets/enums/materials_science/synthesis_methods.py +109 -0
  109. valuesets/enums/medical/__init__.py +1 -0
  110. valuesets/enums/medical/clinical.py +277 -0
  111. valuesets/enums/medical/neuroimaging.py +119 -0
  112. valuesets/enums/mining_processing.py +302 -0
  113. valuesets/enums/physics/__init__.py +1 -0
  114. valuesets/enums/physics/states_of_matter.py +46 -0
  115. valuesets/enums/social/__init__.py +1 -0
  116. valuesets/enums/social/person_status.py +29 -0
  117. valuesets/enums/spatial/__init__.py +1 -0
  118. valuesets/enums/spatial/spatial_qualifiers.py +246 -0
  119. valuesets/enums/statistics/__init__.py +5 -0
  120. valuesets/enums/statistics/prediction_outcomes.py +31 -0
  121. valuesets/enums/statistics.py +31 -0
  122. valuesets/enums/time/__init__.py +1 -0
  123. valuesets/enums/time/temporal.py +254 -0
  124. valuesets/enums/units/__init__.py +1 -0
  125. valuesets/enums/units/measurements.py +310 -0
  126. valuesets/enums/visual/__init__.py +1 -0
  127. valuesets/enums/visual/colors.py +376 -0
  128. valuesets/generators/__init__.py +19 -0
  129. valuesets/generators/auto_slot_injector.py +280 -0
  130. valuesets/generators/enhanced_pydantic_generator.py +100 -0
  131. valuesets/generators/enum_slot_generator.py +201 -0
  132. valuesets/generators/modular_rich_generator.py +353 -0
  133. valuesets/generators/prefix_standardizer.py +198 -0
  134. valuesets/generators/rich_enum.py +127 -0
  135. valuesets/generators/rich_pydantic_generator.py +310 -0
  136. valuesets/generators/smart_slot_syncer.py +428 -0
  137. valuesets/generators/sssom_generator.py +394 -0
  138. valuesets/merged/merged_hierarchy.yaml +21649 -0
  139. valuesets/schema/README.md +3 -0
  140. valuesets/schema/academic/research.yaml +911 -0
  141. valuesets/schema/analytical_chemistry/mass_spectrometry.yaml +206 -0
  142. valuesets/schema/bio/bio_entities.yaml +364 -0
  143. valuesets/schema/bio/biological_colors.yaml +434 -0
  144. valuesets/schema/bio/cell_cycle.yaml +309 -0
  145. valuesets/schema/bio/currency_chemicals.yaml +70 -0
  146. valuesets/schema/bio/developmental_stages.yaml +226 -0
  147. valuesets/schema/bio/genome_features.yaml +342 -0
  148. valuesets/schema/bio/genomics.yaml +101 -0
  149. valuesets/schema/bio/go_aspect.yaml +39 -0
  150. valuesets/schema/bio/go_causality.yaml +119 -0
  151. valuesets/schema/bio/go_evidence.yaml +215 -0
  152. valuesets/schema/bio/insdc_geographic_locations.yaml +911 -0
  153. valuesets/schema/bio/insdc_missing_values.yaml +85 -0
  154. valuesets/schema/bio/lipid_categories.yaml +72 -0
  155. valuesets/schema/bio/plant_biology.yaml +125 -0
  156. valuesets/schema/bio/plant_developmental_stages.yaml +77 -0
  157. valuesets/schema/bio/plant_sex.yaml +108 -0
  158. valuesets/schema/bio/protein_evidence.yaml +63 -0
  159. valuesets/schema/bio/proteomics_standards.yaml +116 -0
  160. valuesets/schema/bio/psi_mi.yaml +400 -0
  161. valuesets/schema/bio/relationship_to_oxygen.yaml +46 -0
  162. valuesets/schema/bio/sequence_alphabets.yaml +1168 -0
  163. valuesets/schema/bio/sequence_chemistry.yaml +477 -0
  164. valuesets/schema/bio/sequencing_platforms.yaml +515 -0
  165. valuesets/schema/bio/structural_biology.yaml +428 -0
  166. valuesets/schema/bio/taxonomy.yaml +453 -0
  167. valuesets/schema/bio/trophic_levels.yaml +118 -0
  168. valuesets/schema/bio/uniprot_species.yaml +1209 -0
  169. valuesets/schema/bio/viral_genome_types.yaml +99 -0
  170. valuesets/schema/bioprocessing/scale_up.yaml +458 -0
  171. valuesets/schema/business/human_resources.yaml +752 -0
  172. valuesets/schema/business/industry_classifications.yaml +448 -0
  173. valuesets/schema/business/management_operations.yaml +602 -0
  174. valuesets/schema/business/organizational_structures.yaml +645 -0
  175. valuesets/schema/business/quality_management.yaml +502 -0
  176. valuesets/schema/business/supply_chain.yaml +688 -0
  177. valuesets/schema/chemistry/chemical_entities.yaml +639 -0
  178. valuesets/schema/chemistry/reaction_directionality.yaml +60 -0
  179. valuesets/schema/chemistry/reactions.yaml +442 -0
  180. valuesets/schema/clinical/nih_demographics.yaml +285 -0
  181. valuesets/schema/clinical/phenopackets.yaml +429 -0
  182. valuesets/schema/computing/file_formats.yaml +631 -0
  183. valuesets/schema/computing/maturity_levels.yaml +229 -0
  184. valuesets/schema/computing/mime_types.yaml +266 -0
  185. valuesets/schema/confidence_levels.yaml +206 -0
  186. valuesets/schema/contributor.yaml +30 -0
  187. valuesets/schema/core.yaml +55 -0
  188. valuesets/schema/data/data_absent_reason.yaml +82 -0
  189. valuesets/schema/data_science/binary_classification.yaml +125 -0
  190. valuesets/schema/data_science/emotion_classification.yaml +109 -0
  191. valuesets/schema/data_science/priority_severity.yaml +122 -0
  192. valuesets/schema/data_science/quality_control.yaml +68 -0
  193. valuesets/schema/data_science/sentiment_analysis.yaml +81 -0
  194. valuesets/schema/data_science/text_classification.yaml +135 -0
  195. valuesets/schema/demographics.yaml +238 -0
  196. valuesets/schema/ecological_interactions.yaml +298 -0
  197. valuesets/schema/energy/energy.yaml +595 -0
  198. valuesets/schema/energy/fossil_fuels.yaml +28 -0
  199. valuesets/schema/energy/nuclear/nuclear_facilities.yaml +463 -0
  200. valuesets/schema/energy/nuclear/nuclear_fuel_cycle.yaml +82 -0
  201. valuesets/schema/energy/nuclear/nuclear_fuels.yaml +421 -0
  202. valuesets/schema/energy/nuclear/nuclear_operations.yaml +480 -0
  203. valuesets/schema/energy/nuclear/nuclear_regulatory.yaml +200 -0
  204. valuesets/schema/energy/nuclear/nuclear_safety.yaml +352 -0
  205. valuesets/schema/energy/nuclear/nuclear_waste.yaml +332 -0
  206. valuesets/schema/energy/nuclear/reactor_types.yaml +394 -0
  207. valuesets/schema/environmental_health/exposures.yaml +355 -0
  208. valuesets/schema/generated_slots.yaml +1828 -0
  209. valuesets/schema/geography/geographic_codes.yaml +1018 -0
  210. valuesets/schema/health/vaccination.yaml +102 -0
  211. valuesets/schema/health.yaml +38 -0
  212. valuesets/schema/healthcare.yaml +53 -0
  213. valuesets/schema/industry/extractive_industry.yaml +89 -0
  214. valuesets/schema/industry/mining.yaml +888 -0
  215. valuesets/schema/industry/safety_colors.yaml +375 -0
  216. valuesets/schema/investigation.yaml +64 -0
  217. valuesets/schema/materials_science/characterization_methods.yaml +193 -0
  218. valuesets/schema/materials_science/crystal_structures.yaml +138 -0
  219. valuesets/schema/materials_science/material_properties.yaml +135 -0
  220. valuesets/schema/materials_science/material_types.yaml +151 -0
  221. valuesets/schema/materials_science/pigments_dyes.yaml +465 -0
  222. valuesets/schema/materials_science/synthesis_methods.yaml +186 -0
  223. valuesets/schema/medical/clinical.yaml +610 -0
  224. valuesets/schema/medical/neuroimaging.yaml +325 -0
  225. valuesets/schema/mining_processing.yaml +295 -0
  226. valuesets/schema/physics/states_of_matter.yaml +46 -0
  227. valuesets/schema/slot_mixins.yaml +143 -0
  228. valuesets/schema/social/person_status.yaml +28 -0
  229. valuesets/schema/spatial/spatial_qualifiers.yaml +466 -0
  230. valuesets/schema/statistics/prediction_outcomes.yaml +26 -0
  231. valuesets/schema/statistics.yaml +34 -0
  232. valuesets/schema/time/temporal.yaml +435 -0
  233. valuesets/schema/types.yaml +15 -0
  234. valuesets/schema/units/measurements.yaml +675 -0
  235. valuesets/schema/valuesets.yaml +100 -0
  236. valuesets/schema/visual/colors.yaml +778 -0
  237. valuesets/utils/__init__.py +6 -0
  238. valuesets/utils/comparison.py +102 -0
  239. valuesets/utils/expand_dynamic_enums.py +414 -0
  240. valuesets/utils/mapping_utils.py +236 -0
  241. valuesets/validators/__init__.py +11 -0
  242. valuesets/validators/enum_evaluator.py +669 -0
  243. valuesets/validators/oak_config.yaml +70 -0
  244. valuesets/validators/validate_with_ols.py +241 -0
  245. valuesets-0.3.1.dist-info/METADATA +395 -0
  246. valuesets-0.3.1.dist-info/RECORD +248 -0
  247. valuesets-0.3.1.dist-info/WHEEL +4 -0
  248. valuesets-0.3.1.dist-info/licenses/LICENSE +201 -0
@@ -0,0 +1,342 @@
1
+ name: genome_features
2
+ title: Genome Feature Types
3
+ description: 'Genome feature types from SOFA (Sequence Ontology Feature Annotation),
4
+
5
+ the subset of SO used in GFF3 files for genome annotation.
6
+
7
+ Organized hierarchically following the Sequence Ontology structure.'
8
+ id: https://w3id.org/linkml/valuesets/bio/genome_features
9
+ imports:
10
+ - linkml:types
11
+ prefixes:
12
+ valuesets: https://w3id.org/valuesets/
13
+ SO: http://purl.obolibrary.org/obo/SO_
14
+ default_prefix: valuesets
15
+ slots:
16
+ genome_feature:
17
+ description: Genome feature types from SOFA (Sequence Ontology Feature Annotation)
18
+ range: GenomeFeatureType
19
+ multivalued: true
20
+ enums:
21
+ GenomeFeatureType:
22
+ description: 'Genome feature types from SOFA (Sequence Ontology Feature Annotation).
23
+
24
+ This is the subset of Sequence Ontology terms used in GFF3 files.
25
+
26
+ Organized hierarchically following the Sequence Ontology structure.'
27
+ permissible_values:
28
+ REGION:
29
+ description: A sequence feature with an extent greater than zero
30
+ meaning: SO:0000001
31
+ BIOLOGICAL_REGION:
32
+ description: A region defined by its biological properties
33
+ meaning: SO:0001411
34
+ is_a: REGION
35
+ GENE:
36
+ description: A region (or regions) that includes all of the sequence elements necessary to encode a functional transcript
37
+ meaning: SO:0000704
38
+ is_a: BIOLOGICAL_REGION
39
+ TRANSCRIPT:
40
+ description: An RNA synthesized on a DNA or RNA template by an RNA polymerase
41
+ meaning: SO:0000673
42
+ is_a: BIOLOGICAL_REGION
43
+ PRIMARY_TRANSCRIPT:
44
+ description: A transcript that has not been processed
45
+ meaning: SO:0000185
46
+ is_a: TRANSCRIPT
47
+ MRNA:
48
+ description: Messenger RNA; includes 5'UTR, coding sequences and 3'UTR
49
+ meaning: SO:0000234
50
+ is_a: TRANSCRIPT
51
+ EXON:
52
+ description: A region of the transcript sequence within a gene which is not removed from the primary RNA transcript
53
+ by RNA splicing
54
+ meaning: SO:0000147
55
+ is_a: BIOLOGICAL_REGION
56
+ CDS:
57
+ description: Coding sequence; sequence of nucleotides that corresponds with the sequence of amino acids in a protein
58
+ meaning: SO:0000316
59
+ is_a: BIOLOGICAL_REGION
60
+ INTRON:
61
+ description: A region of a primary transcript that is transcribed, but removed from within the transcript by splicing
62
+ meaning: SO:0000188
63
+ is_a: BIOLOGICAL_REGION
64
+ FIVE_PRIME_UTR:
65
+ description: 5' untranslated region
66
+ meaning: SO:0000204
67
+ is_a: BIOLOGICAL_REGION
68
+ THREE_PRIME_UTR:
69
+ description: 3' untranslated region
70
+ meaning: SO:0000205
71
+ is_a: BIOLOGICAL_REGION
72
+ NCRNA:
73
+ description: Non-protein coding RNA
74
+ meaning: SO:0000655
75
+ is_a: TRANSCRIPT
76
+ RRNA:
77
+ description: Ribosomal RNA
78
+ meaning: SO:0000252
79
+ is_a: NCRNA
80
+ structured_aliases:
81
+ - literal_form: rRNA
82
+ source: SO:0000252
83
+ TRNA:
84
+ description: Transfer RNA
85
+ meaning: SO:0000253
86
+ is_a: NCRNA
87
+ SNRNA:
88
+ description: Small nuclear RNA
89
+ meaning: SO:0000274
90
+ is_a: NCRNA
91
+ SNORNA:
92
+ description: Small nucleolar RNA
93
+ meaning: SO:0000275
94
+ is_a: NCRNA
95
+ MIRNA:
96
+ description: MicroRNA
97
+ meaning: SO:0000276
98
+ is_a: NCRNA
99
+ LNCRNA:
100
+ description: Long non-coding RNA
101
+ meaning: SO:0001877
102
+ is_a: NCRNA
103
+ RIBOZYME:
104
+ description: An RNA with catalytic activity
105
+ meaning: SO:0000374
106
+ is_a: NCRNA
107
+ ANTISENSE_RNA:
108
+ description: RNA that is complementary to other RNA
109
+ meaning: SO:0000644
110
+ is_a: NCRNA
111
+ PSEUDOGENE:
112
+ description: A sequence that closely resembles a known functional gene but does not produce a functional product
113
+ meaning: SO:0000336
114
+ is_a: BIOLOGICAL_REGION
115
+ PROCESSED_PSEUDOGENE:
116
+ description: A pseudogene arising from reverse transcription of mRNA
117
+ meaning: SO:0000043
118
+ is_a: PSEUDOGENE
119
+ REGULATORY_REGION:
120
+ description: A region involved in the control of the process of gene expression
121
+ meaning: SO:0005836
122
+ is_a: BIOLOGICAL_REGION
123
+ PROMOTER:
124
+ description: A regulatory region initiating transcription
125
+ meaning: SO:0000167
126
+ is_a: REGULATORY_REGION
127
+ ENHANCER:
128
+ description: A cis-acting sequence that increases transcription
129
+ meaning: SO:0000165
130
+ is_a: REGULATORY_REGION
131
+ SILENCER:
132
+ description: A regulatory region which upon binding of transcription factors, suppresses transcription
133
+ meaning: SO:0000625
134
+ is_a: REGULATORY_REGION
135
+ TERMINATOR:
136
+ description: The sequence of DNA located either at the end of the transcript that causes RNA polymerase to terminate
137
+ transcription
138
+ meaning: SO:0000141
139
+ is_a: REGULATORY_REGION
140
+ ATTENUATOR:
141
+ description: A sequence that causes transcription termination
142
+ meaning: SO:0000140
143
+ is_a: REGULATORY_REGION
144
+ POLYA_SIGNAL_SEQUENCE:
145
+ description: The recognition sequence for the cleavage and polyadenylation machinery
146
+ meaning: SO:0000551
147
+ is_a: REGULATORY_REGION
148
+ BINDING_SITE:
149
+ description: A region on a molecule that binds to another molecule
150
+ meaning: SO:0000409
151
+ is_a: BIOLOGICAL_REGION
152
+ TFBS:
153
+ title: TF_binding_site
154
+ description: Transcription factor binding site
155
+ meaning: SO:0000235
156
+ is_a: BINDING_SITE
157
+ RIBOSOME_ENTRY_SITE:
158
+ description: Region where ribosome assembles on mRNA
159
+ meaning: SO:0000139
160
+ is_a: BINDING_SITE
161
+ POLYA_SITE:
162
+ description: Polyadenylation site
163
+ meaning: SO:0000553
164
+ is_a: BIOLOGICAL_REGION
165
+ REPEAT_REGION:
166
+ description: A region of sequence containing one or more repeat units
167
+ meaning: SO:0000657
168
+ is_a: BIOLOGICAL_REGION
169
+ DISPERSED_REPEAT:
170
+ description: A repeat that is interspersed in the genome
171
+ meaning: SO:0000658
172
+ is_a: REPEAT_REGION
173
+ TANDEM_REPEAT:
174
+ description: A repeat where the same sequence is repeated in the same orientation
175
+ meaning: SO:0000705
176
+ is_a: REPEAT_REGION
177
+ INVERTED_REPEAT:
178
+ description: A repeat where the sequence is repeated in the opposite orientation
179
+ meaning: SO:0000294
180
+ is_a: REPEAT_REGION
181
+ TRANSPOSABLE_ELEMENT:
182
+ description: A DNA segment that can change its position within the genome
183
+ meaning: SO:0000101
184
+ is_a: BIOLOGICAL_REGION
185
+ MOBILE_ELEMENT:
186
+ title: mobile_genetic_element
187
+ description: A nucleotide region with the ability to move from one place in the genome to another
188
+ meaning: SO:0001037
189
+ is_a: BIOLOGICAL_REGION
190
+ SEQUENCE_ALTERATION:
191
+ description: A sequence that deviates from the reference sequence
192
+ meaning: SO:0001059
193
+ is_a: REGION
194
+ INSERTION:
195
+ description: The sequence of one or more nucleotides added between two adjacent nucleotides
196
+ meaning: SO:0000667
197
+ is_a: SEQUENCE_ALTERATION
198
+ DELETION:
199
+ description: The removal of a sequences of nucleotides from the genome
200
+ meaning: SO:0000159
201
+ is_a: SEQUENCE_ALTERATION
202
+ INVERSION:
203
+ description: A continuous nucleotide sequence is inverted in the same position
204
+ meaning: SO:1000036
205
+ is_a: SEQUENCE_ALTERATION
206
+ DUPLICATION:
207
+ description: One or more nucleotides are added between two adjacent nucleotides
208
+ meaning: SO:1000035
209
+ is_a: SEQUENCE_ALTERATION
210
+ SUBSTITUTION:
211
+ description: A sequence alteration where one nucleotide replaced by another
212
+ meaning: SO:1000002
213
+ is_a: SEQUENCE_ALTERATION
214
+ ORIGIN_OF_REPLICATION:
215
+ description: The origin of replication; starting site for duplication of a nucleic acid molecule
216
+ meaning: SO:0000296
217
+ is_a: BIOLOGICAL_REGION
218
+ POLYC_TRACT:
219
+ description: A sequence of Cs
220
+ is_a: REGION
221
+ GAP:
222
+ description: A gap in the sequence
223
+ meaning: SO:0000730
224
+ is_a: REGION
225
+ ASSEMBLY_GAP:
226
+ title: gap
227
+ description: A gap between two sequences in an assembly
228
+ meaning: SO:0000730
229
+ is_a: GAP
230
+ CHROMOSOME:
231
+ description: Structural unit composed of DNA and proteins
232
+ meaning: SO:0000340
233
+ is_a: REGION
234
+ SUPERCONTIG:
235
+ description: One or more contigs that have been ordered and oriented using end-read information
236
+ meaning: SO:0000148
237
+ is_a: REGION
238
+ CONTIG:
239
+ description: A contiguous sequence derived from sequence assembly
240
+ meaning: SO:0000149
241
+ is_a: REGION
242
+ SCAFFOLD:
243
+ title: supercontig
244
+ description: One or more contigs that have been ordered and oriented
245
+ meaning: SO:0000148
246
+ is_a: REGION
247
+ CLONE:
248
+ description: A piece of DNA that has been inserted into a vector
249
+ meaning: SO:0000151
250
+ is_a: REGION
251
+ PLASMID:
252
+ description: A self-replicating circular DNA molecule
253
+ meaning: SO:0000155
254
+ is_a: REGION
255
+ POLYPEPTIDE:
256
+ description: A sequence of amino acids linked by peptide bonds
257
+ meaning: SO:0000104
258
+ is_a: REGION
259
+ MATURE_PROTEIN_REGION:
260
+ description: The polypeptide sequence that remains after post-translational processing
261
+ meaning: SO:0000419
262
+ is_a: POLYPEPTIDE
263
+ SIGNAL_PEPTIDE:
264
+ description: A peptide region that targets a polypeptide to a specific location
265
+ meaning: SO:0000418
266
+ is_a: POLYPEPTIDE
267
+ TRANSIT_PEPTIDE:
268
+ description: A peptide that directs the transport of a protein to an organelle
269
+ meaning: SO:0000725
270
+ is_a: POLYPEPTIDE
271
+ PROPEPTIDE:
272
+ title: propeptide
273
+ description: A peptide region that is cleaved during maturation
274
+ meaning: SO:0001062
275
+ is_a: POLYPEPTIDE
276
+ OPERON:
277
+ description: A group of contiguous genes transcribed as a single unit
278
+ meaning: SO:0000178
279
+ is_a: BIOLOGICAL_REGION
280
+ STEM_LOOP:
281
+ description: A double-helical region formed by base-pairing between adjacent sequences
282
+ meaning: SO:0000313
283
+ is_a: REGION
284
+ D_LOOP:
285
+ description: Displacement loop; a region where DNA is displaced by an invading strand
286
+ meaning: SO:0000297
287
+ is_a: REGION
288
+ MATCH:
289
+ description: A region of sequence similarity
290
+ meaning: SO:0000343
291
+ is_a: REGION
292
+ CDNA_MATCH:
293
+ description: A match to a cDNA sequence
294
+ meaning: SO:0000689
295
+ is_a: MATCH
296
+ EST_MATCH:
297
+ description: A match to an EST sequence
298
+ meaning: SO:0000668
299
+ is_a: MATCH
300
+ PROTEIN_MATCH:
301
+ description: A match to a protein sequence
302
+ meaning: SO:0000349
303
+ is_a: MATCH
304
+ NUCLEOTIDE_MATCH:
305
+ description: A match to a nucleotide sequence
306
+ meaning: SO:0000347
307
+ is_a: MATCH
308
+ JUNCTION_FEATURE:
309
+ title: junction
310
+ description: A boundary or junction between sequence regions
311
+ meaning: SO:0000699
312
+ is_a: BIOLOGICAL_REGION
313
+ SPLICE_SITE:
314
+ description: The position where intron is excised
315
+ meaning: SO:0000162
316
+ is_a: JUNCTION_FEATURE
317
+ FIVE_PRIME_SPLICE_SITE:
318
+ title: five_prime_cis_splice_site
319
+ description: The 5' splice site (donor site)
320
+ meaning: SO:0000163
321
+ is_a: SPLICE_SITE
322
+ THREE_PRIME_SPLICE_SITE:
323
+ title: three_prime_cis_splice_site
324
+ description: The 3' splice site (acceptor site)
325
+ meaning: SO:0000164
326
+ is_a: SPLICE_SITE
327
+ START_CODON:
328
+ description: The first codon to be translated
329
+ meaning: SO:0000318
330
+ is_a: BIOLOGICAL_REGION
331
+ STOP_CODON:
332
+ description: The codon that terminates translation
333
+ meaning: SO:0000319
334
+ is_a: BIOLOGICAL_REGION
335
+ CENTROMERE:
336
+ description: A region where chromatids are held together
337
+ meaning: SO:0000577
338
+ is_a: BIOLOGICAL_REGION
339
+ TELOMERE:
340
+ description: The terminal region of a linear chromosome
341
+ meaning: SO:0000624
342
+ is_a: BIOLOGICAL_REGION
@@ -0,0 +1,101 @@
1
+ name: genomics
2
+ title: Genomics Value Sets
3
+ description: Value sets related to genomics and sequencing
4
+ id: https://w3id.org/common-value-sets/genomics
5
+ imports:
6
+ - linkml:types
7
+ prefixes:
8
+ CVS: https://w3id.org/common-value-sets/
9
+ linkml: https://w3id.org/linkml/
10
+ mixs: https://genomicsstandardsconsortium.github.io/mixs/
11
+ valuesets: https://w3id.org/valuesets/
12
+ default_prefix: valuesets
13
+ slots:
14
+ cds_phase:
15
+ description: For features of type CDS (coding sequence), the phase indicates where the feature begins with reference to
16
+ the reading frame
17
+ range: CdsPhaseType
18
+ contig_collection:
19
+ description: The type of the contig set; the type of the 'omics data set
20
+ range: ContigCollectionType
21
+ strand:
22
+ description: The strand that a feature appears on relative to a landmark
23
+ range: StrandType
24
+ sequence:
25
+ description: The type of sequence being represented
26
+ range: SequenceType
27
+ enums:
28
+ CdsPhaseType:
29
+ description: For features of type CDS (coding sequence), the phase indicates where the feature begins with reference to
30
+ the reading frame. The phase is one of the integers 0, 1, or 2, indicating the number of bases that should be removed
31
+ from the beginning of this feature to reach the first base of the next codon.
32
+ permissible_values:
33
+ PHASE_0:
34
+ description: Zero bases from reading frame to feature start.
35
+ title: '0'
36
+ PHASE_1:
37
+ description: One base from reading frame to feature start.
38
+ title: '1'
39
+ PHASE_2:
40
+ description: Two bases from reading frame to feature start.
41
+ title: '2'
42
+ ContigCollectionType:
43
+ description: The type of the contig set; the type of the 'omics data set. Terms are taken from the Genomics Standards
44
+ Consortium where possible. See the GSC checklists at https://genomicsstandardsconsortium.github.io/mixs/ for the controlled
45
+ vocabularies used.
46
+ permissible_values:
47
+ ISOLATE:
48
+ description: 'Sequences assembled from DNA of isolated organism. Bacteria/Archaea: https://genomicsstandardsconsortium.github.io/mixs/0010003/
49
+ Euk: https://genomicsstandardsconsortium.github.io/mixs/0010002/ Virus: https://genomicsstandardsconsortium.github.io/mixs/0010005/
50
+ Organelle: https://genomicsstandardsconsortium.github.io/mixs/0010006/ Plasmid: https://genomicsstandardsconsortium.github.io/mixs/0010004/'
51
+ MAG:
52
+ description: Sequences assembled from DNA of mixed community and binned. MAGs are likely to represent a single taxonomic
53
+ origin. See checkm2 scores for quality assessment.
54
+ meaning: mixs:0010011
55
+ title: Metagenome-Assembled Genome
56
+ aliases:
57
+ - Mimag
58
+ METAGENOME:
59
+ description: Sequences assembled from DNA of mixed community.
60
+ meaning: mixs:0010007
61
+ aliases:
62
+ - Mims
63
+ METATRANSCRIPTOME:
64
+ description: Sequences assembled from RNA of mixed community. Currently not represented by GSC.
65
+ SAG:
66
+ description: Sequences assembled from DNA of single cell.
67
+ meaning: mixs:0010010
68
+ title: Single Amplified Genome
69
+ aliases:
70
+ - Misag
71
+ VIRUS:
72
+ description: Sequences assembled from uncultivated virus genome (DNA/RNA).
73
+ meaning: mixs:0010012
74
+ aliases:
75
+ - Miuvig
76
+ MARKER:
77
+ description: 'Sequences from targeted region of DNA; see protocol for information on targeted region. specimen: https://genomicsstandardsconsortium.github.io/mixs/0010009/
78
+ survey: https://genomicsstandardsconsortium.github.io/mixs/0010008/'
79
+ StrandType:
80
+ description: The strand that a feature appears on relative to a landmark. Also encompasses unknown or irrelevant strandedness.
81
+ permissible_values:
82
+ NEGATIVE:
83
+ description: Represented by "-" in a GFF file; the strand is negative wrt the landmark.
84
+ title: negative
85
+ POSITIVE:
86
+ description: Represented by "+" in a GFF file; the strand is positive with relation to the landmark.
87
+ title: positive
88
+ UNKNOWN:
89
+ description: Represented by "?" in a GFF file. The strandedness is relevant but unknown.
90
+ title: unknown
91
+ UNSTRANDED:
92
+ description: Represented by "." in a GFF file; the feature is not stranded.
93
+ title: unstranded
94
+ SequenceType:
95
+ description: The type of sequence being represented.
96
+ permissible_values:
97
+ NUCLEIC_ACID:
98
+ description: A nucleic acid sequence, as found in an FNA file.
99
+ AMINO_ACID:
100
+ description: An amino acid sequence, as would be found in an FAA file.
101
+ default_range: string
@@ -0,0 +1,39 @@
1
+ name: go_aspect
2
+ title: Gene Ontology Aspects
3
+ description: The three main aspects of Gene Ontology - Molecular Function, Biological Process, and Cellular Component
4
+ id: https://w3id.org/linkml/valuesets/bio/go_aspect
5
+ imports:
6
+ - linkml:types
7
+ prefixes:
8
+ valuesets: https://w3id.org/valuesets/
9
+ GO: http://purl.obolibrary.org/obo/GO_
10
+ default_prefix: valuesets
11
+ slots:
12
+ go_aspect:
13
+ description: Gene Ontology aspect (namespace) - one of molecular function, biological process, or cellular component
14
+ range: GOAspect
15
+ enums:
16
+ GOAspect:
17
+ description: The three main aspects (namespaces) of Gene Ontology
18
+ permissible_values:
19
+ F:
20
+ title: Molecular Function
21
+ description: The activities that occur at the molecular level, such as catalysis or binding
22
+ aliases:
23
+ - molecular_function
24
+ - MF
25
+ meaning: GO:0003674
26
+ P:
27
+ title: Biological Process
28
+ description: The larger processes accomplished by multiple molecular activities
29
+ aliases:
30
+ - biological_process
31
+ - BP
32
+ meaning: GO:0008150
33
+ C:
34
+ title: Cellular Component
35
+ description: The locations relative to cellular structures in which a gene product performs a function
36
+ aliases:
37
+ - cellular_component
38
+ - CC
39
+ meaning: GO:0005575
@@ -0,0 +1,119 @@
1
+ name: go_causality
2
+ title: Gene Ontology Causality Value Sets
3
+ description: Value sets for GO causal relationships and predicates used in gene ontology annotations and pathway analysis
4
+ id: https://w3id.org/valuesets/bio/go_causality
5
+ imports:
6
+ - linkml:types
7
+ prefixes:
8
+ linkml: https://w3id.org/linkml/
9
+ RO: http://purl.obolibrary.org/obo/RO_
10
+ valuesets: https://w3id.org/valuesets/
11
+ default_prefix: valuesets
12
+ slots:
13
+ causal_predicate:
14
+ description: A term describing the causal relationship between two activities drawn from the Relation Ontology
15
+ range: CausalPredicateEnum
16
+ enums:
17
+ CausalPredicateEnum:
18
+ description: A term describing the causal relationship between two activities. All terms are drawn from
19
+ the "causally upstream or within" (RO:0002418) branch of the Relation Ontology (RO).
20
+ permissible_values:
21
+ CONSTITUTIVELY_UPSTREAM_OF:
22
+ title: constitutively upstream of
23
+ meaning: RO:0012009
24
+ PROVIDES_INPUT_FOR:
25
+ title: provides input for
26
+ meaning: RO:0002413
27
+ REMOVES_INPUT_FOR:
28
+ title: removes input for
29
+ meaning: RO:0012010
30
+ CAUSALLY_UPSTREAM_OF:
31
+ title: causally upstream of
32
+ meaning: RO:0002411
33
+ aliases:
34
+ - undetermined
35
+ comments:
36
+ - Abstract parent class for causal relationships
37
+ CAUSALLY_UPSTREAM_OF_POSITIVE_EFFECT:
38
+ title: causally upstream of, positive effect
39
+ is_a: CAUSALLY_UPSTREAM_OF
40
+ meaning: RO:0002304
41
+ annotations:
42
+ symbol: "+"
43
+ direction: POSITIVE
44
+ CAUSALLY_UPSTREAM_OF_NEGATIVE_EFFECT:
45
+ title: causally upstream of, negative effect
46
+ is_a: CAUSALLY_UPSTREAM_OF
47
+ meaning: RO:0002305
48
+ annotations:
49
+ symbol: "-"
50
+ direction: NEGATIVE
51
+ REGULATES:
52
+ title: regulates
53
+ is_a: CAUSALLY_UPSTREAM_OF
54
+ meaning: RO:0002211
55
+ annotations:
56
+ symbol: "R"
57
+ comments:
58
+ - Abstract parent class for regulation relationships
59
+ NEGATIVELY_REGULATES:
60
+ title: negatively regulates
61
+ is_a: REGULATES
62
+ meaning: RO:0002212
63
+ annotations:
64
+ symbol: "-R"
65
+ direction: NEGATIVE
66
+ comments:
67
+ - Abstract parent class for negative regulation relationships
68
+ POSITIVELY_REGULATES:
69
+ title: positively regulates
70
+ is_a: REGULATES
71
+ meaning: RO:0002213
72
+ annotations:
73
+ symbol: "+R"
74
+ direction: POSITIVE
75
+ comments:
76
+ - Abstract parent class for positive regulation relationships
77
+ DIRECTLY_NEGATIVELY_REGULATES:
78
+ title: directly negatively regulates
79
+ is_a: NEGATIVELY_REGULATES
80
+ meaning: RO:0002630
81
+ annotations:
82
+ directness: DIRECT
83
+ direction: NEGATIVE
84
+ INDIRECTLY_NEGATIVELY_REGULATES:
85
+ title: indirectly negatively regulates
86
+ is_a: NEGATIVELY_REGULATES
87
+ meaning: RO:0002409
88
+ annotations:
89
+ directness: INDIRECT
90
+ direction: NEGATIVE
91
+ DIRECTLY_POSITIVELY_REGULATES:
92
+ title: directly positively regulates
93
+ is_a: POSITIVELY_REGULATES
94
+ meaning: RO:0002629
95
+ annotations:
96
+ directness: DIRECT
97
+ direction: POSITIVE
98
+ INDIRECTLY_POSITIVELY_REGULATES:
99
+ title: indirectly positively regulates
100
+ is_a: POSITIVELY_REGULATES
101
+ meaning: RO:0002407
102
+ annotations:
103
+ directness: INDIRECT
104
+ direction: POSITIVE
105
+ IS_SMALL_MOLECULE_REGULATOR_OF:
106
+ title: is small molecule regulator of
107
+ meaning: RO:0012004
108
+ IS_SMALL_MOLECULE_ACTIVATOR_OF:
109
+ title: is small molecule activator of
110
+ is_a: IS_SMALL_MOLECULE_REGULATOR_OF
111
+ meaning: RO:0012005
112
+ annotations:
113
+ direction: POSITIVE
114
+ IS_SMALL_MOLECULE_INHIBITOR_OF:
115
+ title: is small molecule inhibitor of
116
+ is_a: IS_SMALL_MOLECULE_REGULATOR_OF
117
+ meaning: RO:0012006
118
+ annotations:
119
+ direction: NEGATIVE