valuesets 0.3.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of valuesets might be problematic. Click here for more details.

Files changed (248) hide show
  1. valuesets/__init__.py +7 -0
  2. valuesets/_version.py +8 -0
  3. valuesets/datamodel/valuesets.py +13796 -0
  4. valuesets/datamodel/valuesets_dataclass.py +24503 -0
  5. valuesets/datamodel/valuesets_pydantic.py +13796 -0
  6. valuesets/enums/__init__.py +590 -0
  7. valuesets/enums/academic/__init__.py +1 -0
  8. valuesets/enums/academic/research.py +559 -0
  9. valuesets/enums/analytical_chemistry/__init__.py +1 -0
  10. valuesets/enums/analytical_chemistry/mass_spectrometry.py +198 -0
  11. valuesets/enums/bio/__init__.py +1 -0
  12. valuesets/enums/bio/biological_colors.py +238 -0
  13. valuesets/enums/bio/cell_cycle.py +180 -0
  14. valuesets/enums/bio/currency_chemicals.py +52 -0
  15. valuesets/enums/bio/developmental_stages.py +103 -0
  16. valuesets/enums/bio/genome_features.py +182 -0
  17. valuesets/enums/bio/genomics.py +91 -0
  18. valuesets/enums/bio/go_aspect.py +32 -0
  19. valuesets/enums/bio/go_causality.py +58 -0
  20. valuesets/enums/bio/go_evidence.py +129 -0
  21. valuesets/enums/bio/human_developmental_stages.py +62 -0
  22. valuesets/enums/bio/insdc_geographic_locations.py +591 -0
  23. valuesets/enums/bio/insdc_missing_values.py +49 -0
  24. valuesets/enums/bio/lipid_categories.py +67 -0
  25. valuesets/enums/bio/mouse_developmental_stages.py +62 -0
  26. valuesets/enums/bio/plant_biology.py +86 -0
  27. valuesets/enums/bio/plant_developmental_stages.py +54 -0
  28. valuesets/enums/bio/plant_sex.py +81 -0
  29. valuesets/enums/bio/protein_evidence.py +61 -0
  30. valuesets/enums/bio/proteomics_standards.py +123 -0
  31. valuesets/enums/bio/psi_mi.py +306 -0
  32. valuesets/enums/bio/relationship_to_oxygen.py +37 -0
  33. valuesets/enums/bio/sequence_alphabets.py +449 -0
  34. valuesets/enums/bio/sequence_chemistry.py +357 -0
  35. valuesets/enums/bio/sequencing_platforms.py +302 -0
  36. valuesets/enums/bio/structural_biology.py +320 -0
  37. valuesets/enums/bio/taxonomy.py +238 -0
  38. valuesets/enums/bio/trophic_levels.py +85 -0
  39. valuesets/enums/bio/uniprot_species.py +344 -0
  40. valuesets/enums/bio/viral_genome_types.py +47 -0
  41. valuesets/enums/bioprocessing/__init__.py +1 -0
  42. valuesets/enums/bioprocessing/scale_up.py +249 -0
  43. valuesets/enums/business/__init__.py +1 -0
  44. valuesets/enums/business/human_resources.py +275 -0
  45. valuesets/enums/business/industry_classifications.py +181 -0
  46. valuesets/enums/business/management_operations.py +228 -0
  47. valuesets/enums/business/organizational_structures.py +236 -0
  48. valuesets/enums/business/quality_management.py +181 -0
  49. valuesets/enums/business/supply_chain.py +232 -0
  50. valuesets/enums/chemistry/__init__.py +1 -0
  51. valuesets/enums/chemistry/chemical_entities.py +315 -0
  52. valuesets/enums/chemistry/reaction_directionality.py +65 -0
  53. valuesets/enums/chemistry/reactions.py +256 -0
  54. valuesets/enums/clinical/__init__.py +1 -0
  55. valuesets/enums/clinical/nih_demographics.py +177 -0
  56. valuesets/enums/clinical/phenopackets.py +254 -0
  57. valuesets/enums/common_value_sets.py +8791 -0
  58. valuesets/enums/computing/__init__.py +1 -0
  59. valuesets/enums/computing/file_formats.py +294 -0
  60. valuesets/enums/computing/maturity_levels.py +196 -0
  61. valuesets/enums/computing/mime_types.py +227 -0
  62. valuesets/enums/confidence_levels.py +168 -0
  63. valuesets/enums/contributor.py +30 -0
  64. valuesets/enums/core.py +42 -0
  65. valuesets/enums/data/__init__.py +1 -0
  66. valuesets/enums/data/data_absent_reason.py +53 -0
  67. valuesets/enums/data_science/__init__.py +1 -0
  68. valuesets/enums/data_science/binary_classification.py +87 -0
  69. valuesets/enums/data_science/emotion_classification.py +66 -0
  70. valuesets/enums/data_science/priority_severity.py +73 -0
  71. valuesets/enums/data_science/quality_control.py +46 -0
  72. valuesets/enums/data_science/sentiment_analysis.py +50 -0
  73. valuesets/enums/data_science/text_classification.py +97 -0
  74. valuesets/enums/demographics.py +206 -0
  75. valuesets/enums/ecological_interactions.py +151 -0
  76. valuesets/enums/energy/__init__.py +1 -0
  77. valuesets/enums/energy/energy.py +343 -0
  78. valuesets/enums/energy/fossil_fuels.py +29 -0
  79. valuesets/enums/energy/nuclear/__init__.py +1 -0
  80. valuesets/enums/energy/nuclear/nuclear_facilities.py +195 -0
  81. valuesets/enums/energy/nuclear/nuclear_fuel_cycle.py +96 -0
  82. valuesets/enums/energy/nuclear/nuclear_fuels.py +175 -0
  83. valuesets/enums/energy/nuclear/nuclear_operations.py +191 -0
  84. valuesets/enums/energy/nuclear/nuclear_regulatory.py +188 -0
  85. valuesets/enums/energy/nuclear/nuclear_safety.py +164 -0
  86. valuesets/enums/energy/nuclear/nuclear_waste.py +158 -0
  87. valuesets/enums/energy/nuclear/reactor_types.py +163 -0
  88. valuesets/enums/environmental_health/__init__.py +1 -0
  89. valuesets/enums/environmental_health/exposures.py +265 -0
  90. valuesets/enums/geography/__init__.py +1 -0
  91. valuesets/enums/geography/geographic_codes.py +741 -0
  92. valuesets/enums/health/__init__.py +12 -0
  93. valuesets/enums/health/vaccination.py +98 -0
  94. valuesets/enums/health.py +36 -0
  95. valuesets/enums/health_base.py +36 -0
  96. valuesets/enums/healthcare.py +45 -0
  97. valuesets/enums/industry/__init__.py +1 -0
  98. valuesets/enums/industry/extractive_industry.py +94 -0
  99. valuesets/enums/industry/mining.py +388 -0
  100. valuesets/enums/industry/safety_colors.py +201 -0
  101. valuesets/enums/investigation.py +27 -0
  102. valuesets/enums/materials_science/__init__.py +1 -0
  103. valuesets/enums/materials_science/characterization_methods.py +112 -0
  104. valuesets/enums/materials_science/crystal_structures.py +76 -0
  105. valuesets/enums/materials_science/material_properties.py +119 -0
  106. valuesets/enums/materials_science/material_types.py +104 -0
  107. valuesets/enums/materials_science/pigments_dyes.py +198 -0
  108. valuesets/enums/materials_science/synthesis_methods.py +109 -0
  109. valuesets/enums/medical/__init__.py +1 -0
  110. valuesets/enums/medical/clinical.py +277 -0
  111. valuesets/enums/medical/neuroimaging.py +119 -0
  112. valuesets/enums/mining_processing.py +302 -0
  113. valuesets/enums/physics/__init__.py +1 -0
  114. valuesets/enums/physics/states_of_matter.py +46 -0
  115. valuesets/enums/social/__init__.py +1 -0
  116. valuesets/enums/social/person_status.py +29 -0
  117. valuesets/enums/spatial/__init__.py +1 -0
  118. valuesets/enums/spatial/spatial_qualifiers.py +246 -0
  119. valuesets/enums/statistics/__init__.py +5 -0
  120. valuesets/enums/statistics/prediction_outcomes.py +31 -0
  121. valuesets/enums/statistics.py +31 -0
  122. valuesets/enums/time/__init__.py +1 -0
  123. valuesets/enums/time/temporal.py +254 -0
  124. valuesets/enums/units/__init__.py +1 -0
  125. valuesets/enums/units/measurements.py +310 -0
  126. valuesets/enums/visual/__init__.py +1 -0
  127. valuesets/enums/visual/colors.py +376 -0
  128. valuesets/generators/__init__.py +19 -0
  129. valuesets/generators/auto_slot_injector.py +280 -0
  130. valuesets/generators/enhanced_pydantic_generator.py +100 -0
  131. valuesets/generators/enum_slot_generator.py +201 -0
  132. valuesets/generators/modular_rich_generator.py +353 -0
  133. valuesets/generators/prefix_standardizer.py +198 -0
  134. valuesets/generators/rich_enum.py +127 -0
  135. valuesets/generators/rich_pydantic_generator.py +310 -0
  136. valuesets/generators/smart_slot_syncer.py +428 -0
  137. valuesets/generators/sssom_generator.py +394 -0
  138. valuesets/merged/merged_hierarchy.yaml +21649 -0
  139. valuesets/schema/README.md +3 -0
  140. valuesets/schema/academic/research.yaml +911 -0
  141. valuesets/schema/analytical_chemistry/mass_spectrometry.yaml +206 -0
  142. valuesets/schema/bio/bio_entities.yaml +364 -0
  143. valuesets/schema/bio/biological_colors.yaml +434 -0
  144. valuesets/schema/bio/cell_cycle.yaml +309 -0
  145. valuesets/schema/bio/currency_chemicals.yaml +70 -0
  146. valuesets/schema/bio/developmental_stages.yaml +226 -0
  147. valuesets/schema/bio/genome_features.yaml +342 -0
  148. valuesets/schema/bio/genomics.yaml +101 -0
  149. valuesets/schema/bio/go_aspect.yaml +39 -0
  150. valuesets/schema/bio/go_causality.yaml +119 -0
  151. valuesets/schema/bio/go_evidence.yaml +215 -0
  152. valuesets/schema/bio/insdc_geographic_locations.yaml +911 -0
  153. valuesets/schema/bio/insdc_missing_values.yaml +85 -0
  154. valuesets/schema/bio/lipid_categories.yaml +72 -0
  155. valuesets/schema/bio/plant_biology.yaml +125 -0
  156. valuesets/schema/bio/plant_developmental_stages.yaml +77 -0
  157. valuesets/schema/bio/plant_sex.yaml +108 -0
  158. valuesets/schema/bio/protein_evidence.yaml +63 -0
  159. valuesets/schema/bio/proteomics_standards.yaml +116 -0
  160. valuesets/schema/bio/psi_mi.yaml +400 -0
  161. valuesets/schema/bio/relationship_to_oxygen.yaml +46 -0
  162. valuesets/schema/bio/sequence_alphabets.yaml +1168 -0
  163. valuesets/schema/bio/sequence_chemistry.yaml +477 -0
  164. valuesets/schema/bio/sequencing_platforms.yaml +515 -0
  165. valuesets/schema/bio/structural_biology.yaml +428 -0
  166. valuesets/schema/bio/taxonomy.yaml +453 -0
  167. valuesets/schema/bio/trophic_levels.yaml +118 -0
  168. valuesets/schema/bio/uniprot_species.yaml +1209 -0
  169. valuesets/schema/bio/viral_genome_types.yaml +99 -0
  170. valuesets/schema/bioprocessing/scale_up.yaml +458 -0
  171. valuesets/schema/business/human_resources.yaml +752 -0
  172. valuesets/schema/business/industry_classifications.yaml +448 -0
  173. valuesets/schema/business/management_operations.yaml +602 -0
  174. valuesets/schema/business/organizational_structures.yaml +645 -0
  175. valuesets/schema/business/quality_management.yaml +502 -0
  176. valuesets/schema/business/supply_chain.yaml +688 -0
  177. valuesets/schema/chemistry/chemical_entities.yaml +639 -0
  178. valuesets/schema/chemistry/reaction_directionality.yaml +60 -0
  179. valuesets/schema/chemistry/reactions.yaml +442 -0
  180. valuesets/schema/clinical/nih_demographics.yaml +285 -0
  181. valuesets/schema/clinical/phenopackets.yaml +429 -0
  182. valuesets/schema/computing/file_formats.yaml +631 -0
  183. valuesets/schema/computing/maturity_levels.yaml +229 -0
  184. valuesets/schema/computing/mime_types.yaml +266 -0
  185. valuesets/schema/confidence_levels.yaml +206 -0
  186. valuesets/schema/contributor.yaml +30 -0
  187. valuesets/schema/core.yaml +55 -0
  188. valuesets/schema/data/data_absent_reason.yaml +82 -0
  189. valuesets/schema/data_science/binary_classification.yaml +125 -0
  190. valuesets/schema/data_science/emotion_classification.yaml +109 -0
  191. valuesets/schema/data_science/priority_severity.yaml +122 -0
  192. valuesets/schema/data_science/quality_control.yaml +68 -0
  193. valuesets/schema/data_science/sentiment_analysis.yaml +81 -0
  194. valuesets/schema/data_science/text_classification.yaml +135 -0
  195. valuesets/schema/demographics.yaml +238 -0
  196. valuesets/schema/ecological_interactions.yaml +298 -0
  197. valuesets/schema/energy/energy.yaml +595 -0
  198. valuesets/schema/energy/fossil_fuels.yaml +28 -0
  199. valuesets/schema/energy/nuclear/nuclear_facilities.yaml +463 -0
  200. valuesets/schema/energy/nuclear/nuclear_fuel_cycle.yaml +82 -0
  201. valuesets/schema/energy/nuclear/nuclear_fuels.yaml +421 -0
  202. valuesets/schema/energy/nuclear/nuclear_operations.yaml +480 -0
  203. valuesets/schema/energy/nuclear/nuclear_regulatory.yaml +200 -0
  204. valuesets/schema/energy/nuclear/nuclear_safety.yaml +352 -0
  205. valuesets/schema/energy/nuclear/nuclear_waste.yaml +332 -0
  206. valuesets/schema/energy/nuclear/reactor_types.yaml +394 -0
  207. valuesets/schema/environmental_health/exposures.yaml +355 -0
  208. valuesets/schema/generated_slots.yaml +1828 -0
  209. valuesets/schema/geography/geographic_codes.yaml +1018 -0
  210. valuesets/schema/health/vaccination.yaml +102 -0
  211. valuesets/schema/health.yaml +38 -0
  212. valuesets/schema/healthcare.yaml +53 -0
  213. valuesets/schema/industry/extractive_industry.yaml +89 -0
  214. valuesets/schema/industry/mining.yaml +888 -0
  215. valuesets/schema/industry/safety_colors.yaml +375 -0
  216. valuesets/schema/investigation.yaml +64 -0
  217. valuesets/schema/materials_science/characterization_methods.yaml +193 -0
  218. valuesets/schema/materials_science/crystal_structures.yaml +138 -0
  219. valuesets/schema/materials_science/material_properties.yaml +135 -0
  220. valuesets/schema/materials_science/material_types.yaml +151 -0
  221. valuesets/schema/materials_science/pigments_dyes.yaml +465 -0
  222. valuesets/schema/materials_science/synthesis_methods.yaml +186 -0
  223. valuesets/schema/medical/clinical.yaml +610 -0
  224. valuesets/schema/medical/neuroimaging.yaml +325 -0
  225. valuesets/schema/mining_processing.yaml +295 -0
  226. valuesets/schema/physics/states_of_matter.yaml +46 -0
  227. valuesets/schema/slot_mixins.yaml +143 -0
  228. valuesets/schema/social/person_status.yaml +28 -0
  229. valuesets/schema/spatial/spatial_qualifiers.yaml +466 -0
  230. valuesets/schema/statistics/prediction_outcomes.yaml +26 -0
  231. valuesets/schema/statistics.yaml +34 -0
  232. valuesets/schema/time/temporal.yaml +435 -0
  233. valuesets/schema/types.yaml +15 -0
  234. valuesets/schema/units/measurements.yaml +675 -0
  235. valuesets/schema/valuesets.yaml +100 -0
  236. valuesets/schema/visual/colors.yaml +778 -0
  237. valuesets/utils/__init__.py +6 -0
  238. valuesets/utils/comparison.py +102 -0
  239. valuesets/utils/expand_dynamic_enums.py +414 -0
  240. valuesets/utils/mapping_utils.py +236 -0
  241. valuesets/validators/__init__.py +11 -0
  242. valuesets/validators/enum_evaluator.py +669 -0
  243. valuesets/validators/oak_config.yaml +70 -0
  244. valuesets/validators/validate_with_ols.py +241 -0
  245. valuesets-0.3.1.dist-info/METADATA +395 -0
  246. valuesets-0.3.1.dist-info/RECORD +248 -0
  247. valuesets-0.3.1.dist-info/WHEEL +4 -0
  248. valuesets-0.3.1.dist-info/licenses/LICENSE +201 -0
@@ -0,0 +1,1168 @@
1
+ name: sequence_alphabets
2
+ title: Biological Sequence Alphabet Value Sets
3
+ description: 'Alphabets for biological sequences including DNA, RNA, and protein sequences. Includes standard alphabets and
4
+ extended versions with ambiguity codes following IUPAC nomenclature and common bioinformatics standards.
5
+
6
+ '
7
+ id: https://w3id.org/valuesets/bio/sequence_alphabets
8
+ imports:
9
+ - linkml:types
10
+ prefixes:
11
+ linkml: https://w3id.org/linkml/
12
+ SO: http://purl.obolibrary.org/obo/SO_
13
+ CHEBI: http://purl.obolibrary.org/obo/CHEBI_
14
+ EDAM: http://edamontology.org/
15
+ GENO: http://purl.obolibrary.org/obo/GENO_
16
+ valuesets: https://w3id.org/valuesets/
17
+ default_prefix: valuesets
18
+ slots:
19
+ dna_base:
20
+ description: Standard DNA nucleotide bases (canonical)
21
+ range: DNABaseEnum
22
+ dna_base_extended:
23
+ description: Extended DNA alphabet with IUPAC ambiguity codes
24
+ range: DNABaseExtendedEnum
25
+ rna_base:
26
+ description: Standard RNA nucleotide bases (canonical)
27
+ range: RNABaseEnum
28
+ rna_base_extended:
29
+ description: Extended RNA alphabet with IUPAC ambiguity codes
30
+ range: RNABaseExtendedEnum
31
+ amino_acid:
32
+ description: Standard amino acid single letter codes
33
+ range: AminoAcidEnum
34
+ amino_acid_extended:
35
+ description: Extended amino acid alphabet with ambiguity codes and special characters
36
+ range: AminoAcidExtendedEnum
37
+ codon:
38
+ description: Standard genetic code codons (DNA)
39
+ range: CodonEnum
40
+ nucleotide_modification:
41
+ description: Common nucleotide modifications
42
+ range: NucleotideModificationEnum
43
+ sequence_quality:
44
+ description: Sequence quality indicators (Phred scores)
45
+ range: SequenceQualityEnum
46
+ enums:
47
+ DNABaseEnum:
48
+ description: Standard DNA nucleotide bases (canonical)
49
+ permissible_values:
50
+ A:
51
+ title: Adenine
52
+ aliases:
53
+ - adenine
54
+ meaning: CHEBI:16708
55
+ annotations:
56
+ complement: T
57
+ purine: 'true'
58
+ chemical_formula: C5H5N5
59
+ C:
60
+ title: Cytosine
61
+ aliases:
62
+ - cytosine
63
+ meaning: CHEBI:16040
64
+ annotations:
65
+ complement: G
66
+ pyrimidine: 'true'
67
+ chemical_formula: C4H5N3O
68
+ G:
69
+ title: Guanine
70
+ aliases:
71
+ - guanine
72
+ meaning: CHEBI:16235
73
+ annotations:
74
+ complement: C
75
+ purine: 'true'
76
+ chemical_formula: C5H5N5O
77
+ T:
78
+ title: Thymine
79
+ aliases:
80
+ - thymine
81
+ meaning: CHEBI:17821
82
+ annotations:
83
+ complement: A
84
+ pyrimidine: 'true'
85
+ chemical_formula: C5H6N2O2
86
+ DNABaseExtendedEnum:
87
+ description: Extended DNA alphabet with IUPAC ambiguity codes
88
+ permissible_values:
89
+ A:
90
+ title: Adenine
91
+ aliases:
92
+ - adenine
93
+ meaning: CHEBI:16708
94
+ annotations:
95
+ represents: A
96
+ C:
97
+ title: Cytosine
98
+ aliases:
99
+ - cytosine
100
+ meaning: CHEBI:16040
101
+ annotations:
102
+ represents: C
103
+ G:
104
+ title: Guanine
105
+ aliases:
106
+ - guanine
107
+ meaning: CHEBI:16235
108
+ annotations:
109
+ represents: G
110
+ T:
111
+ title: Thymine
112
+ aliases:
113
+ - thymine
114
+ meaning: CHEBI:17821
115
+ annotations:
116
+ represents: T
117
+ R:
118
+ title: Purine (A or G)
119
+ annotations:
120
+ represents: A,G
121
+ iupac: 'true'
122
+ Y:
123
+ title: Pyrimidine (C or T)
124
+ annotations:
125
+ represents: C,T
126
+ iupac: 'true'
127
+ S:
128
+ title: Strong (G or C)
129
+ annotations:
130
+ represents: G,C
131
+ iupac: 'true'
132
+ bond_strength: strong (3 H-bonds)
133
+ W:
134
+ title: Weak (A or T)
135
+ annotations:
136
+ represents: A,T
137
+ iupac: 'true'
138
+ bond_strength: weak (2 H-bonds)
139
+ K:
140
+ title: Keto (G or T)
141
+ annotations:
142
+ represents: G,T
143
+ iupac: 'true'
144
+ M:
145
+ title: Amino (A or C)
146
+ annotations:
147
+ represents: A,C
148
+ iupac: 'true'
149
+ B:
150
+ title: Not A (C, G, or T)
151
+ annotations:
152
+ represents: C,G,T
153
+ iupac: 'true'
154
+ D:
155
+ title: Not C (A, G, or T)
156
+ annotations:
157
+ represents: A,G,T
158
+ iupac: 'true'
159
+ H:
160
+ title: Not G (A, C, or T)
161
+ annotations:
162
+ represents: A,C,T
163
+ iupac: 'true'
164
+ V:
165
+ title: Not T (A, C, or G)
166
+ annotations:
167
+ represents: A,C,G
168
+ iupac: 'true'
169
+ N:
170
+ title: Any nucleotide (A, C, G, or T)
171
+ annotations:
172
+ represents: A,C,G,T
173
+ iupac: 'true'
174
+ GAP:
175
+ title: Gap character
176
+ annotations:
177
+ symbol: '-'
178
+ represents: gap
179
+ RNABaseEnum:
180
+ description: Standard RNA nucleotide bases (canonical)
181
+ permissible_values:
182
+ A:
183
+ title: Adenine
184
+ aliases:
185
+ - adenine
186
+ meaning: CHEBI:16708
187
+ annotations:
188
+ complement: U
189
+ purine: 'true'
190
+ chemical_formula: C5H5N5
191
+ C:
192
+ title: Cytosine
193
+ aliases:
194
+ - cytosine
195
+ meaning: CHEBI:16040
196
+ annotations:
197
+ complement: G
198
+ pyrimidine: 'true'
199
+ chemical_formula: C4H5N3O
200
+ G:
201
+ title: Guanine
202
+ aliases:
203
+ - guanine
204
+ meaning: CHEBI:16235
205
+ annotations:
206
+ complement: C
207
+ purine: 'true'
208
+ chemical_formula: C5H5N5O
209
+ U:
210
+ title: Uracil
211
+ aliases:
212
+ - uracil
213
+ meaning: CHEBI:17568
214
+ annotations:
215
+ complement: A
216
+ pyrimidine: 'true'
217
+ chemical_formula: C4H4N2O2
218
+ RNABaseExtendedEnum:
219
+ description: Extended RNA alphabet with IUPAC ambiguity codes
220
+ permissible_values:
221
+ A:
222
+ title: Adenine
223
+ aliases:
224
+ - adenine
225
+ meaning: CHEBI:16708
226
+ annotations:
227
+ represents: A
228
+ C:
229
+ title: Cytosine
230
+ aliases:
231
+ - cytosine
232
+ meaning: CHEBI:16040
233
+ annotations:
234
+ represents: C
235
+ G:
236
+ title: Guanine
237
+ aliases:
238
+ - guanine
239
+ meaning: CHEBI:16235
240
+ annotations:
241
+ represents: G
242
+ U:
243
+ title: Uracil
244
+ aliases:
245
+ - uracil
246
+ meaning: CHEBI:17568
247
+ annotations:
248
+ represents: U
249
+ R:
250
+ title: Purine (A or G)
251
+ annotations:
252
+ represents: A,G
253
+ iupac: 'true'
254
+ Y:
255
+ title: Pyrimidine (C or U)
256
+ annotations:
257
+ represents: C,U
258
+ iupac: 'true'
259
+ S:
260
+ title: Strong (G or C)
261
+ annotations:
262
+ represents: G,C
263
+ iupac: 'true'
264
+ W:
265
+ title: Weak (A or U)
266
+ annotations:
267
+ represents: A,U
268
+ iupac: 'true'
269
+ K:
270
+ title: Keto (G or U)
271
+ annotations:
272
+ represents: G,U
273
+ iupac: 'true'
274
+ M:
275
+ title: Amino (A or C)
276
+ annotations:
277
+ represents: A,C
278
+ iupac: 'true'
279
+ B:
280
+ title: Not A (C, G, or U)
281
+ annotations:
282
+ represents: C,G,U
283
+ iupac: 'true'
284
+ D:
285
+ title: Not C (A, G, or U)
286
+ annotations:
287
+ represents: A,G,U
288
+ iupac: 'true'
289
+ H:
290
+ title: Not G (A, C, or U)
291
+ annotations:
292
+ represents: A,C,U
293
+ iupac: 'true'
294
+ V:
295
+ title: Not U (A, C, or G)
296
+ annotations:
297
+ represents: A,C,G
298
+ iupac: 'true'
299
+ N:
300
+ title: Any nucleotide (A, C, G, or U)
301
+ annotations:
302
+ represents: A,C,G,U
303
+ iupac: 'true'
304
+ GAP:
305
+ title: Gap character
306
+ annotations:
307
+ symbol: '-'
308
+ represents: gap
309
+ AminoAcidEnum:
310
+ description: Standard amino acid single letter codes
311
+ permissible_values:
312
+ A:
313
+ title: Alanine
314
+ aliases:
315
+ - alanine
316
+ meaning: CHEBI:16449
317
+ annotations:
318
+ three_letter: Ala
319
+ polarity: nonpolar
320
+ essential: 'false'
321
+ molecular_weight: '89.09'
322
+ C:
323
+ title: Cysteine
324
+ aliases:
325
+ - L-cysteine
326
+ meaning: CHEBI:17561
327
+ annotations:
328
+ three_letter: Cys
329
+ polarity: polar
330
+ essential: 'false'
331
+ molecular_weight: '121.15'
332
+ special: forms disulfide bonds
333
+ D:
334
+ title: Aspartic acid
335
+ aliases:
336
+ - L-aspartic acid
337
+ meaning: CHEBI:17053
338
+ annotations:
339
+ three_letter: Asp
340
+ polarity: acidic
341
+ essential: 'false'
342
+ molecular_weight: '133.10'
343
+ charge: negative
344
+ E:
345
+ title: Glutamic acid
346
+ aliases:
347
+ - L-glutamic acid
348
+ meaning: CHEBI:16015
349
+ annotations:
350
+ three_letter: Glu
351
+ polarity: acidic
352
+ essential: 'false'
353
+ molecular_weight: '147.13'
354
+ charge: negative
355
+ F:
356
+ title: Phenylalanine
357
+ aliases:
358
+ - L-phenylalanine
359
+ meaning: CHEBI:17295
360
+ annotations:
361
+ three_letter: Phe
362
+ polarity: nonpolar
363
+ essential: 'true'
364
+ molecular_weight: '165.19'
365
+ aromatic: 'true'
366
+ G:
367
+ title: Glycine
368
+ aliases:
369
+ - glycine
370
+ meaning: CHEBI:15428
371
+ annotations:
372
+ three_letter: Gly
373
+ polarity: nonpolar
374
+ essential: 'false'
375
+ molecular_weight: '75.07'
376
+ special: smallest, most flexible
377
+ H:
378
+ title: Histidine
379
+ aliases:
380
+ - L-histidine
381
+ meaning: CHEBI:15971
382
+ annotations:
383
+ three_letter: His
384
+ polarity: basic
385
+ essential: 'true'
386
+ molecular_weight: '155.16'
387
+ charge: positive
388
+ I:
389
+ title: Isoleucine
390
+ aliases:
391
+ - L-isoleucine
392
+ meaning: CHEBI:17191
393
+ annotations:
394
+ three_letter: Ile
395
+ polarity: nonpolar
396
+ essential: 'true'
397
+ molecular_weight: '131.17'
398
+ branched: 'true'
399
+ K:
400
+ title: Lysine
401
+ aliases:
402
+ - L-lysine
403
+ meaning: CHEBI:18019
404
+ annotations:
405
+ three_letter: Lys
406
+ polarity: basic
407
+ essential: 'true'
408
+ molecular_weight: '146.19'
409
+ charge: positive
410
+ L:
411
+ title: Leucine
412
+ aliases:
413
+ - L-leucine
414
+ meaning: CHEBI:15603
415
+ annotations:
416
+ three_letter: Leu
417
+ polarity: nonpolar
418
+ essential: 'true'
419
+ molecular_weight: '131.17'
420
+ branched: 'true'
421
+ M:
422
+ title: Methionine
423
+ aliases:
424
+ - L-methionine
425
+ meaning: CHEBI:16643
426
+ annotations:
427
+ three_letter: Met
428
+ polarity: nonpolar
429
+ essential: 'true'
430
+ molecular_weight: '149.21'
431
+ special: start codon
432
+ N:
433
+ title: Asparagine
434
+ aliases:
435
+ - L-asparagine
436
+ meaning: CHEBI:17196
437
+ annotations:
438
+ three_letter: Asn
439
+ polarity: polar
440
+ essential: 'false'
441
+ molecular_weight: '132.12'
442
+ P:
443
+ title: Proline
444
+ aliases:
445
+ - L-proline
446
+ meaning: CHEBI:17203
447
+ annotations:
448
+ three_letter: Pro
449
+ polarity: nonpolar
450
+ essential: 'false'
451
+ molecular_weight: '115.13'
452
+ special: helix breaker, rigid
453
+ Q:
454
+ title: Glutamine
455
+ aliases:
456
+ - L-glutamine
457
+ meaning: CHEBI:18050
458
+ annotations:
459
+ three_letter: Gln
460
+ polarity: polar
461
+ essential: 'false'
462
+ molecular_weight: '146.15'
463
+ R:
464
+ title: Arginine
465
+ aliases:
466
+ - L-arginine
467
+ meaning: CHEBI:16467
468
+ annotations:
469
+ three_letter: Arg
470
+ polarity: basic
471
+ essential: 'false'
472
+ molecular_weight: '174.20'
473
+ charge: positive
474
+ S:
475
+ title: Serine
476
+ aliases:
477
+ - L-serine
478
+ meaning: CHEBI:17115
479
+ annotations:
480
+ three_letter: Ser
481
+ polarity: polar
482
+ essential: 'false'
483
+ molecular_weight: '105.09'
484
+ hydroxyl: 'true'
485
+ T:
486
+ title: Threonine
487
+ aliases:
488
+ - L-threonine
489
+ meaning: CHEBI:16857
490
+ annotations:
491
+ three_letter: Thr
492
+ polarity: polar
493
+ essential: 'true'
494
+ molecular_weight: '119.12'
495
+ hydroxyl: 'true'
496
+ V:
497
+ title: Valine
498
+ aliases:
499
+ - L-valine
500
+ meaning: CHEBI:16414
501
+ annotations:
502
+ three_letter: Val
503
+ polarity: nonpolar
504
+ essential: 'true'
505
+ molecular_weight: '117.15'
506
+ branched: 'true'
507
+ W:
508
+ title: Tryptophan
509
+ aliases:
510
+ - L-tryptophan
511
+ meaning: CHEBI:16828
512
+ annotations:
513
+ three_letter: Trp
514
+ polarity: nonpolar
515
+ essential: 'true'
516
+ molecular_weight: '204.23'
517
+ aromatic: 'true'
518
+ special: largest
519
+ Y:
520
+ title: Tyrosine
521
+ aliases:
522
+ - L-tyrosine
523
+ meaning: CHEBI:17895
524
+ annotations:
525
+ three_letter: Tyr
526
+ polarity: polar
527
+ essential: 'false'
528
+ molecular_weight: '181.19'
529
+ aromatic: 'true'
530
+ hydroxyl: 'true'
531
+ AminoAcidExtendedEnum:
532
+ description: Extended amino acid alphabet with ambiguity codes and special characters
533
+ permissible_values:
534
+ A:
535
+ title: Alanine
536
+ aliases:
537
+ - alanine
538
+ meaning: CHEBI:16449
539
+ annotations:
540
+ three_letter: Ala
541
+ C:
542
+ title: Cysteine
543
+ aliases:
544
+ - L-cysteine
545
+ meaning: CHEBI:17561
546
+ annotations:
547
+ three_letter: Cys
548
+ D:
549
+ title: Aspartic acid
550
+ aliases:
551
+ - L-aspartic acid
552
+ meaning: CHEBI:17053
553
+ annotations:
554
+ three_letter: Asp
555
+ E:
556
+ title: Glutamic acid
557
+ aliases:
558
+ - L-glutamic acid
559
+ meaning: CHEBI:16015
560
+ annotations:
561
+ three_letter: Glu
562
+ F:
563
+ title: Phenylalanine
564
+ aliases:
565
+ - L-phenylalanine
566
+ meaning: CHEBI:17295
567
+ annotations:
568
+ three_letter: Phe
569
+ G:
570
+ title: Glycine
571
+ aliases:
572
+ - glycine
573
+ meaning: CHEBI:15428
574
+ annotations:
575
+ three_letter: Gly
576
+ H:
577
+ title: Histidine
578
+ aliases:
579
+ - L-histidine
580
+ meaning: CHEBI:15971
581
+ annotations:
582
+ three_letter: His
583
+ I:
584
+ title: Isoleucine
585
+ aliases:
586
+ - L-isoleucine
587
+ meaning: CHEBI:17191
588
+ annotations:
589
+ three_letter: Ile
590
+ K:
591
+ title: Lysine
592
+ aliases:
593
+ - L-lysine
594
+ meaning: CHEBI:18019
595
+ annotations:
596
+ three_letter: Lys
597
+ L:
598
+ title: Leucine
599
+ aliases:
600
+ - L-leucine
601
+ meaning: CHEBI:15603
602
+ annotations:
603
+ three_letter: Leu
604
+ M:
605
+ title: Methionine
606
+ aliases:
607
+ - L-methionine
608
+ meaning: CHEBI:16643
609
+ annotations:
610
+ three_letter: Met
611
+ N:
612
+ title: Asparagine
613
+ aliases:
614
+ - L-asparagine
615
+ meaning: CHEBI:17196
616
+ annotations:
617
+ three_letter: Asn
618
+ P:
619
+ title: Proline
620
+ aliases:
621
+ - L-proline
622
+ meaning: CHEBI:17203
623
+ annotations:
624
+ three_letter: Pro
625
+ Q:
626
+ title: Glutamine
627
+ aliases:
628
+ - L-glutamine
629
+ meaning: CHEBI:18050
630
+ annotations:
631
+ three_letter: Gln
632
+ R:
633
+ title: Arginine
634
+ aliases:
635
+ - L-arginine
636
+ meaning: CHEBI:16467
637
+ annotations:
638
+ three_letter: Arg
639
+ S:
640
+ title: Serine
641
+ aliases:
642
+ - L-serine
643
+ meaning: CHEBI:17115
644
+ annotations:
645
+ three_letter: Ser
646
+ T:
647
+ title: Threonine
648
+ aliases:
649
+ - L-threonine
650
+ meaning: CHEBI:16857
651
+ annotations:
652
+ three_letter: Thr
653
+ V:
654
+ title: Valine
655
+ aliases:
656
+ - L-valine
657
+ meaning: CHEBI:16414
658
+ annotations:
659
+ three_letter: Val
660
+ W:
661
+ title: Tryptophan
662
+ aliases:
663
+ - L-tryptophan
664
+ meaning: CHEBI:16828
665
+ annotations:
666
+ three_letter: Trp
667
+ Y:
668
+ title: Tyrosine
669
+ aliases:
670
+ - L-tyrosine
671
+ meaning: CHEBI:17895
672
+ annotations:
673
+ three_letter: Tyr
674
+ B:
675
+ title: Aspartic acid or Asparagine (D or N)
676
+ aliases:
677
+ - L-aspartic acid or Asparagine (D or N)
678
+ annotations:
679
+ three_letter: Asx
680
+ represents: D,N
681
+ ambiguity: 'true'
682
+ Z:
683
+ title: Glutamic acid or Glutamine (E or Q)
684
+ aliases:
685
+ - L-glutamic acid or Glutamine (E or Q)
686
+ annotations:
687
+ three_letter: Glx
688
+ represents: E,Q
689
+ ambiguity: 'true'
690
+ J:
691
+ title: Leucine or Isoleucine (L or I)
692
+ aliases:
693
+ - L-leucine or Isoleucine (L or I)
694
+ annotations:
695
+ three_letter: Xle
696
+ represents: L,I
697
+ ambiguity: 'true'
698
+ X:
699
+ title: Any amino acid
700
+ annotations:
701
+ three_letter: Xaa
702
+ represents: any
703
+ ambiguity: 'true'
704
+ STOP:
705
+ title: Translation stop/termination
706
+ annotations:
707
+ symbol: '*'
708
+ three_letter: Ter
709
+ represents: stop codon
710
+ GAP:
711
+ title: Gap character
712
+ annotations:
713
+ symbol: '-'
714
+ represents: gap
715
+ U:
716
+ title: Selenocysteine
717
+ aliases:
718
+ - L-selenocysteine
719
+ meaning: CHEBI:16633
720
+ annotations:
721
+ three_letter: Sec
722
+ special: 21st amino acid
723
+ codon: UGA with SECIS element
724
+ O:
725
+ title: Pyrrolysine (22nd amino acid)
726
+ meaning: CHEBI:21860
727
+ aliases:
728
+ - L-pyrrolysine
729
+ annotations:
730
+ three_letter: Pyl
731
+ special: 22nd amino acid
732
+ codon: UAG in certain archaea/bacteria
733
+ CodonEnum:
734
+ description: Standard genetic code codons (DNA)
735
+ permissible_values:
736
+ TTT:
737
+ title: Phenylalanine codon
738
+ annotations:
739
+ amino_acid: F
740
+ amino_acid_name: Phenylalanine
741
+ TTC:
742
+ title: Phenylalanine codon
743
+ annotations:
744
+ amino_acid: F
745
+ amino_acid_name: Phenylalanine
746
+ TTA:
747
+ title: Leucine codon
748
+ annotations:
749
+ amino_acid: L
750
+ amino_acid_name: Leucine
751
+ TTG:
752
+ title: Leucine codon
753
+ annotations:
754
+ amino_acid: L
755
+ amino_acid_name: Leucine
756
+ CTT:
757
+ title: Leucine codon
758
+ annotations:
759
+ amino_acid: L
760
+ amino_acid_name: Leucine
761
+ CTC:
762
+ title: Leucine codon
763
+ annotations:
764
+ amino_acid: L
765
+ amino_acid_name: Leucine
766
+ CTA:
767
+ title: Leucine codon
768
+ annotations:
769
+ amino_acid: L
770
+ amino_acid_name: Leucine
771
+ CTG:
772
+ title: Leucine codon
773
+ annotations:
774
+ amino_acid: L
775
+ amino_acid_name: Leucine
776
+ ATT:
777
+ title: Isoleucine codon
778
+ annotations:
779
+ amino_acid: I
780
+ amino_acid_name: Isoleucine
781
+ ATC:
782
+ title: Isoleucine codon
783
+ annotations:
784
+ amino_acid: I
785
+ amino_acid_name: Isoleucine
786
+ ATA:
787
+ title: Isoleucine codon
788
+ annotations:
789
+ amino_acid: I
790
+ amino_acid_name: Isoleucine
791
+ ATG:
792
+ title: Methionine codon (start codon)
793
+ annotations:
794
+ amino_acid: M
795
+ amino_acid_name: Methionine
796
+ special: start codon
797
+ GTT:
798
+ title: Valine codon
799
+ annotations:
800
+ amino_acid: V
801
+ amino_acid_name: Valine
802
+ GTC:
803
+ title: Valine codon
804
+ annotations:
805
+ amino_acid: V
806
+ amino_acid_name: Valine
807
+ GTA:
808
+ title: Valine codon
809
+ annotations:
810
+ amino_acid: V
811
+ amino_acid_name: Valine
812
+ GTG:
813
+ title: Valine codon
814
+ annotations:
815
+ amino_acid: V
816
+ amino_acid_name: Valine
817
+ TCT:
818
+ title: Serine codon
819
+ annotations:
820
+ amino_acid: S
821
+ amino_acid_name: Serine
822
+ TCC:
823
+ title: Serine codon
824
+ annotations:
825
+ amino_acid: S
826
+ amino_acid_name: Serine
827
+ TCA:
828
+ title: Serine codon
829
+ annotations:
830
+ amino_acid: S
831
+ amino_acid_name: Serine
832
+ TCG:
833
+ title: Serine codon
834
+ annotations:
835
+ amino_acid: S
836
+ amino_acid_name: Serine
837
+ AGT:
838
+ title: Serine codon
839
+ annotations:
840
+ amino_acid: S
841
+ amino_acid_name: Serine
842
+ AGC:
843
+ title: Serine codon
844
+ annotations:
845
+ amino_acid: S
846
+ amino_acid_name: Serine
847
+ CCT:
848
+ title: Proline codon
849
+ annotations:
850
+ amino_acid: P
851
+ amino_acid_name: Proline
852
+ CCC:
853
+ title: Proline codon
854
+ annotations:
855
+ amino_acid: P
856
+ amino_acid_name: Proline
857
+ CCA:
858
+ title: Proline codon
859
+ annotations:
860
+ amino_acid: P
861
+ amino_acid_name: Proline
862
+ CCG:
863
+ title: Proline codon
864
+ annotations:
865
+ amino_acid: P
866
+ amino_acid_name: Proline
867
+ ACT:
868
+ title: Threonine codon
869
+ annotations:
870
+ amino_acid: T
871
+ amino_acid_name: Threonine
872
+ ACC:
873
+ title: Threonine codon
874
+ annotations:
875
+ amino_acid: T
876
+ amino_acid_name: Threonine
877
+ ACA:
878
+ title: Threonine codon
879
+ annotations:
880
+ amino_acid: T
881
+ amino_acid_name: Threonine
882
+ ACG:
883
+ title: Threonine codon
884
+ annotations:
885
+ amino_acid: T
886
+ amino_acid_name: Threonine
887
+ GCT:
888
+ title: Alanine codon
889
+ annotations:
890
+ amino_acid: A
891
+ amino_acid_name: Alanine
892
+ GCC:
893
+ title: Alanine codon
894
+ annotations:
895
+ amino_acid: A
896
+ amino_acid_name: Alanine
897
+ GCA:
898
+ title: Alanine codon
899
+ annotations:
900
+ amino_acid: A
901
+ amino_acid_name: Alanine
902
+ GCG:
903
+ title: Alanine codon
904
+ annotations:
905
+ amino_acid: A
906
+ amino_acid_name: Alanine
907
+ TAT:
908
+ title: Tyrosine codon
909
+ annotations:
910
+ amino_acid: Y
911
+ amino_acid_name: Tyrosine
912
+ TAC:
913
+ title: Tyrosine codon
914
+ annotations:
915
+ amino_acid: Y
916
+ amino_acid_name: Tyrosine
917
+ TAA:
918
+ title: Stop codon (ochre)
919
+ annotations:
920
+ amino_acid: '*'
921
+ name: ochre
922
+ special: stop codon
923
+ TAG:
924
+ title: Stop codon (amber)
925
+ annotations:
926
+ amino_acid: '*'
927
+ name: amber
928
+ special: stop codon
929
+ TGA:
930
+ title: Stop codon (opal/umber)
931
+ annotations:
932
+ amino_acid: '*'
933
+ name: opal
934
+ special: stop codon or selenocysteine
935
+ CAT:
936
+ title: Histidine codon
937
+ annotations:
938
+ amino_acid: H
939
+ amino_acid_name: Histidine
940
+ CAC:
941
+ title: Histidine codon
942
+ annotations:
943
+ amino_acid: H
944
+ amino_acid_name: Histidine
945
+ CAA:
946
+ title: Glutamine codon
947
+ annotations:
948
+ amino_acid: Q
949
+ amino_acid_name: Glutamine
950
+ CAG:
951
+ title: Glutamine codon
952
+ annotations:
953
+ amino_acid: Q
954
+ amino_acid_name: Glutamine
955
+ AAT:
956
+ title: Asparagine codon
957
+ annotations:
958
+ amino_acid: N
959
+ amino_acid_name: Asparagine
960
+ AAC:
961
+ title: Asparagine codon
962
+ annotations:
963
+ amino_acid: N
964
+ amino_acid_name: Asparagine
965
+ AAA:
966
+ title: Lysine codon
967
+ annotations:
968
+ amino_acid: K
969
+ amino_acid_name: Lysine
970
+ AAG:
971
+ title: Lysine codon
972
+ annotations:
973
+ amino_acid: K
974
+ amino_acid_name: Lysine
975
+ GAT:
976
+ title: Aspartic acid codon
977
+ annotations:
978
+ amino_acid: D
979
+ amino_acid_name: Aspartic acid
980
+ GAC:
981
+ title: Aspartic acid codon
982
+ annotations:
983
+ amino_acid: D
984
+ amino_acid_name: Aspartic acid
985
+ GAA:
986
+ title: Glutamic acid codon
987
+ annotations:
988
+ amino_acid: E
989
+ amino_acid_name: Glutamic acid
990
+ GAG:
991
+ title: Glutamic acid codon
992
+ annotations:
993
+ amino_acid: E
994
+ amino_acid_name: Glutamic acid
995
+ TGT:
996
+ title: Cysteine codon
997
+ annotations:
998
+ amino_acid: C
999
+ amino_acid_name: Cysteine
1000
+ TGC:
1001
+ title: Cysteine codon
1002
+ annotations:
1003
+ amino_acid: C
1004
+ amino_acid_name: Cysteine
1005
+ TGG:
1006
+ title: Tryptophan codon
1007
+ annotations:
1008
+ amino_acid: W
1009
+ amino_acid_name: Tryptophan
1010
+ CGT:
1011
+ title: Arginine codon
1012
+ annotations:
1013
+ amino_acid: R
1014
+ amino_acid_name: Arginine
1015
+ CGC:
1016
+ title: Arginine codon
1017
+ annotations:
1018
+ amino_acid: R
1019
+ amino_acid_name: Arginine
1020
+ CGA:
1021
+ title: Arginine codon
1022
+ annotations:
1023
+ amino_acid: R
1024
+ amino_acid_name: Arginine
1025
+ CGG:
1026
+ title: Arginine codon
1027
+ annotations:
1028
+ amino_acid: R
1029
+ amino_acid_name: Arginine
1030
+ AGA:
1031
+ title: Arginine codon
1032
+ annotations:
1033
+ amino_acid: R
1034
+ amino_acid_name: Arginine
1035
+ AGG:
1036
+ title: Arginine codon
1037
+ annotations:
1038
+ amino_acid: R
1039
+ amino_acid_name: Arginine
1040
+ GGT:
1041
+ title: Glycine codon
1042
+ annotations:
1043
+ amino_acid: G
1044
+ amino_acid_name: Glycine
1045
+ GGC:
1046
+ title: Glycine codon
1047
+ annotations:
1048
+ amino_acid: G
1049
+ amino_acid_name: Glycine
1050
+ GGA:
1051
+ title: Glycine codon
1052
+ annotations:
1053
+ amino_acid: G
1054
+ amino_acid_name: Glycine
1055
+ GGG:
1056
+ title: Glycine codon
1057
+ annotations:
1058
+ amino_acid: G
1059
+ amino_acid_name: Glycine
1060
+ NucleotideModificationEnum:
1061
+ description: Common nucleotide modifications
1062
+ permissible_values:
1063
+ FIVE_METHYL_C:
1064
+ title: 5-methylcytosine
1065
+ description: 5-methylcytosine
1066
+ meaning: CHEBI:27551
1067
+ annotations:
1068
+ symbol: m5C
1069
+ type: DNA methylation
1070
+ function: gene regulation
1071
+ SIX_METHYL_A:
1072
+ title: N(6)-methyladenosine
1073
+ description: N6-methyladenosine
1074
+ meaning: CHEBI:21891
1075
+ annotations:
1076
+ symbol: m6A
1077
+ type: RNA modification
1078
+ function: RNA stability, translation
1079
+ PSEUDOURIDINE:
1080
+ description: Pseudouridine
1081
+ meaning: CHEBI:17802
1082
+ annotations:
1083
+ symbol: Ψ
1084
+ type: RNA modification
1085
+ function: RNA stability
1086
+ INOSINE:
1087
+ description: Inosine
1088
+ meaning: CHEBI:17596
1089
+ annotations:
1090
+ symbol: I
1091
+ type: RNA editing
1092
+ pairs_with: A, C, U
1093
+ DIHYDROURIDINE:
1094
+ title: dihydrouridine
1095
+ description: Dihydrouridine
1096
+ meaning: CHEBI:23774
1097
+ annotations:
1098
+ symbol: D
1099
+ type: tRNA modification
1100
+ SEVEN_METHYL_G:
1101
+ title: 7-methylguanosine
1102
+ description: 7-methylguanosine
1103
+ meaning: CHEBI:20794
1104
+ annotations:
1105
+ symbol: m7G
1106
+ type: mRNA cap
1107
+ function: translation initiation
1108
+ FIVE_HYDROXY_METHYL_C:
1109
+ title: 5-(hydroxymethyl)cytosine
1110
+ description: 5-hydroxymethylcytosine
1111
+ meaning: CHEBI:76792
1112
+ annotations:
1113
+ symbol: hmC
1114
+ type: DNA modification
1115
+ function: demethylation intermediate
1116
+ EIGHT_OXO_G:
1117
+ title: 8-oxoguanine
1118
+ description: 8-oxoguanine
1119
+ meaning: CHEBI:44605
1120
+ annotations:
1121
+ symbol: 8-oxoG
1122
+ type: oxidative damage
1123
+ pairs_with: A or C
1124
+ SequenceQualityEnum:
1125
+ description: Sequence quality indicators (Phred scores)
1126
+ permissible_values:
1127
+ Q0:
1128
+ description: Phred quality 0 (100% error probability)
1129
+ annotations:
1130
+ phred_score: '0'
1131
+ error_probability: '1.0'
1132
+ ascii_char: '!'
1133
+ Q10:
1134
+ description: Phred quality 10 (10% error probability)
1135
+ annotations:
1136
+ phred_score: '10'
1137
+ error_probability: '0.1'
1138
+ ascii_char: +
1139
+ Q20:
1140
+ description: Phred quality 20 (1% error probability)
1141
+ annotations:
1142
+ phred_score: '20'
1143
+ error_probability: '0.01'
1144
+ ascii_char: '5'
1145
+ Q30:
1146
+ description: Phred quality 30 (0.1% error probability)
1147
+ annotations:
1148
+ phred_score: '30'
1149
+ error_probability: '0.001'
1150
+ ascii_char: '?'
1151
+ Q40:
1152
+ description: Phred quality 40 (0.01% error probability)
1153
+ annotations:
1154
+ phred_score: '40'
1155
+ error_probability: '0.0001'
1156
+ ascii_char: I
1157
+ Q50:
1158
+ description: Phred quality 50 (0.001% error probability)
1159
+ annotations:
1160
+ phred_score: '50'
1161
+ error_probability: '0.00001'
1162
+ ascii_char: S
1163
+ Q60:
1164
+ description: Phred quality 60 (0.0001% error probability)
1165
+ annotations:
1166
+ phred_score: '60'
1167
+ error_probability: '0.000001'
1168
+ ascii_char: ']'