RNApolis 0.4.13__tar.gz → 0.4.15__tar.gz
Sign up to get free protection for your applications and to get access to all the features.
- {rnapolis-0.4.13/src/RNApolis.egg-info → rnapolis-0.4.15}/PKG-INFO +11 -2
- {rnapolis-0.4.13 → rnapolis-0.4.15}/setup.py +1 -1
- {rnapolis-0.4.13 → rnapolis-0.4.15/src/RNApolis.egg-info}/PKG-INFO +11 -2
- {rnapolis-0.4.13 → rnapolis-0.4.15}/src/rnapolis/annotator.py +2 -1
- {rnapolis-0.4.13 → rnapolis-0.4.15}/src/rnapolis/molecule_filter.py +16 -2
- {rnapolis-0.4.13 → rnapolis-0.4.15}/src/rnapolis/parser.py +13 -2
- {rnapolis-0.4.13 → rnapolis-0.4.15}/tests/test_molecule_filter.py +6 -4
- {rnapolis-0.4.13 → rnapolis-0.4.15}/tests/test_parser.py +19 -0
- {rnapolis-0.4.13 → rnapolis-0.4.15}/LICENSE +0 -0
- {rnapolis-0.4.13 → rnapolis-0.4.15}/README.md +0 -0
- {rnapolis-0.4.13 → rnapolis-0.4.15}/pyproject.toml +0 -0
- {rnapolis-0.4.13 → rnapolis-0.4.15}/setup.cfg +0 -0
- {rnapolis-0.4.13 → rnapolis-0.4.15}/src/RNApolis.egg-info/SOURCES.txt +0 -0
- {rnapolis-0.4.13 → rnapolis-0.4.15}/src/RNApolis.egg-info/dependency_links.txt +0 -0
- {rnapolis-0.4.13 → rnapolis-0.4.15}/src/RNApolis.egg-info/entry_points.txt +0 -0
- {rnapolis-0.4.13 → rnapolis-0.4.15}/src/RNApolis.egg-info/requires.txt +0 -0
- {rnapolis-0.4.13 → rnapolis-0.4.15}/src/RNApolis.egg-info/top_level.txt +0 -0
- {rnapolis-0.4.13 → rnapolis-0.4.15}/src/rnapolis/clashfinder.py +0 -0
- {rnapolis-0.4.13 → rnapolis-0.4.15}/src/rnapolis/common.py +0 -0
- {rnapolis-0.4.13 → rnapolis-0.4.15}/src/rnapolis/metareader.py +0 -0
- {rnapolis-0.4.13 → rnapolis-0.4.15}/src/rnapolis/motif_extractor.py +0 -0
- {rnapolis-0.4.13 → rnapolis-0.4.15}/src/rnapolis/rfam_folder.py +0 -0
- {rnapolis-0.4.13 → rnapolis-0.4.15}/src/rnapolis/tertiary.py +0 -0
- {rnapolis-0.4.13 → rnapolis-0.4.15}/src/rnapolis/transformer.py +0 -0
- {rnapolis-0.4.13 → rnapolis-0.4.15}/src/rnapolis/util.py +0 -0
- {rnapolis-0.4.13 → rnapolis-0.4.15}/tests/test_annotator.py +0 -0
- {rnapolis-0.4.13 → rnapolis-0.4.15}/tests/test_bugfixes.py +0 -0
- {rnapolis-0.4.13 → rnapolis-0.4.15}/tests/test_common.py +0 -0
- {rnapolis-0.4.13 → rnapolis-0.4.15}/tests/test_metareader.py +0 -0
- {rnapolis-0.4.13 → rnapolis-0.4.15}/tests/test_quadruplexes.py +0 -0
- {rnapolis-0.4.13 → rnapolis-0.4.15}/tests/test_rfam_folder.py +0 -0
- {rnapolis-0.4.13 → rnapolis-0.4.15}/tests/test_tertiary.py +0 -0
- {rnapolis-0.4.13 → rnapolis-0.4.15}/tests/test_transformer.py +0 -0
@@ -1,6 +1,6 @@
|
|
1
|
-
Metadata-Version: 2.
|
1
|
+
Metadata-Version: 2.2
|
2
2
|
Name: RNApolis
|
3
|
-
Version: 0.4.
|
3
|
+
Version: 0.4.15
|
4
4
|
Summary: A Python library containing RNA-related bioinformatics functions and classes
|
5
5
|
Home-page: https://github.com/tzok/rnapolis-py
|
6
6
|
Author: Tomasz Zok
|
@@ -26,6 +26,15 @@ Requires-Dist: pulp
|
|
26
26
|
Requires-Dist: requests
|
27
27
|
Requires-Dist: scipy
|
28
28
|
Requires-Dist: viennarna
|
29
|
+
Dynamic: author
|
30
|
+
Dynamic: author-email
|
31
|
+
Dynamic: classifier
|
32
|
+
Dynamic: description
|
33
|
+
Dynamic: description-content-type
|
34
|
+
Dynamic: home-page
|
35
|
+
Dynamic: project-url
|
36
|
+
Dynamic: requires-dist
|
37
|
+
Dynamic: summary
|
29
38
|
|
30
39
|
# RNApolis
|
31
40
|
|
@@ -1,6 +1,6 @@
|
|
1
|
-
Metadata-Version: 2.
|
1
|
+
Metadata-Version: 2.2
|
2
2
|
Name: RNApolis
|
3
|
-
Version: 0.4.
|
3
|
+
Version: 0.4.15
|
4
4
|
Summary: A Python library containing RNA-related bioinformatics functions and classes
|
5
5
|
Home-page: https://github.com/tzok/rnapolis-py
|
6
6
|
Author: Tomasz Zok
|
@@ -26,6 +26,15 @@ Requires-Dist: pulp
|
|
26
26
|
Requires-Dist: requests
|
27
27
|
Requires-Dist: scipy
|
28
28
|
Requires-Dist: viennarna
|
29
|
+
Dynamic: author
|
30
|
+
Dynamic: author-email
|
31
|
+
Dynamic: classifier
|
32
|
+
Dynamic: description
|
33
|
+
Dynamic: description-content-type
|
34
|
+
Dynamic: home-page
|
35
|
+
Dynamic: project-url
|
36
|
+
Dynamic: requires-dist
|
37
|
+
Dynamic: summary
|
29
38
|
|
30
39
|
# RNApolis
|
31
40
|
|
@@ -11,6 +11,8 @@ import numpy
|
|
11
11
|
import numpy.typing
|
12
12
|
import orjson
|
13
13
|
from ordered_set import OrderedSet
|
14
|
+
from scipy.spatial import KDTree
|
15
|
+
|
14
16
|
from rnapolis.common import (
|
15
17
|
BR,
|
16
18
|
BaseInteractions,
|
@@ -42,7 +44,6 @@ from rnapolis.tertiary import (
|
|
42
44
|
torsion_angle,
|
43
45
|
)
|
44
46
|
from rnapolis.util import handle_input_file
|
45
|
-
from scipy.spatial import KDTree
|
46
47
|
|
47
48
|
HYDROGEN_BOND_MAX_DISTANCE = 4.0
|
48
49
|
HYDROGEN_BOND_ANGLE_RANGE = (50.0, 130.0) # 90 degrees is ideal, so allow +- 40 degrees
|
@@ -156,7 +156,9 @@ def select_category_by_id(
|
|
156
156
|
|
157
157
|
|
158
158
|
def filter_by_poly_types(
|
159
|
-
file_content: str,
|
159
|
+
file_content: str,
|
160
|
+
entity_poly_types: Iterable[str] = ["polyribonucleotide"],
|
161
|
+
retain_categories: Iterable[str] = [],
|
160
162
|
) -> str:
|
161
163
|
adapter = IoAdapterPy()
|
162
164
|
|
@@ -187,13 +189,20 @@ def filter_by_poly_types(
|
|
187
189
|
obj = DataCategory(category, attributes, rows)
|
188
190
|
output.append(obj)
|
189
191
|
|
192
|
+
for category in retain_categories:
|
193
|
+
obj = data[0].getObj(category)
|
194
|
+
if obj:
|
195
|
+
output.append(obj)
|
196
|
+
|
190
197
|
with tempfile.NamedTemporaryFile("rt+") as tmp:
|
191
198
|
adapter.writeFile(tmp.name, [output])
|
192
199
|
tmp.seek(0)
|
193
200
|
return tmp.read()
|
194
201
|
|
195
202
|
|
196
|
-
def filter_by_chains(
|
203
|
+
def filter_by_chains(
|
204
|
+
file_content: str, chains: Iterable[str], retain_categories: Iterable[str] = []
|
205
|
+
) -> str:
|
197
206
|
"""
|
198
207
|
Filter a PDBx/mmCIF file by chain IDs. The function returns a new PDBx/mmCIF file.
|
199
208
|
|
@@ -228,6 +237,11 @@ def filter_by_chains(file_content: str, chains: Iterable[str]) -> str:
|
|
228
237
|
obj = DataCategory(category, attributes, rows)
|
229
238
|
output.append(obj)
|
230
239
|
|
240
|
+
for category in retain_categories:
|
241
|
+
obj = data[0].getObj(category)
|
242
|
+
if obj:
|
243
|
+
output.append(obj)
|
244
|
+
|
231
245
|
with tempfile.NamedTemporaryFile("rt+") as tmp:
|
232
246
|
adapter.writeFile(tmp.name, [output])
|
233
247
|
tmp.seek(0)
|
@@ -218,7 +218,9 @@ def parse_cif(
|
|
218
218
|
)
|
219
219
|
|
220
220
|
if entity_id and pdbx_seq_one_letter_code_can:
|
221
|
-
sequence_by_entity[entity_id] =
|
221
|
+
sequence_by_entity[entity_id] = (
|
222
|
+
pdbx_seq_one_letter_code_can.replace("\n", "")
|
223
|
+
)
|
222
224
|
|
223
225
|
if entity:
|
224
226
|
for row in entity.getRowList():
|
@@ -234,7 +236,16 @@ def parse_cif(
|
|
234
236
|
|
235
237
|
if type_:
|
236
238
|
is_nucleic_acid_by_entity[entity_id] = (
|
237
|
-
is_nucleic_acid_by_entity.get(
|
239
|
+
is_nucleic_acid_by_entity.get(
|
240
|
+
entity_id,
|
241
|
+
type_
|
242
|
+
in (
|
243
|
+
"peptide nucleic acid",
|
244
|
+
"polydeoxyribonucleotide",
|
245
|
+
"polydeoxyribonucleotide/polyribonucleotide hybrid",
|
246
|
+
"polyribonucleotide",
|
247
|
+
),
|
248
|
+
)
|
238
249
|
)
|
239
250
|
|
240
251
|
atoms = filter_clashing_atoms(atoms_to_process)
|
@@ -9,8 +9,9 @@ def test_filter_by_poly_types():
|
|
9
9
|
with open("tests/1a9n.cif") as f:
|
10
10
|
content = f.read()
|
11
11
|
|
12
|
-
filtered = filter_by_poly_types(content, ["polyribonucleotide"])
|
13
|
-
assert re.search(r"^_entity
|
12
|
+
filtered = filter_by_poly_types(content, ["polyribonucleotide"], ["chem_comp"])
|
13
|
+
assert re.search(r"^_entity\.id", filtered, re.MULTILINE) is not None
|
14
|
+
assert re.search(r"^_chem_comp\.id", filtered, re.MULTILINE) is not None
|
14
15
|
|
15
16
|
with tempfile.NamedTemporaryFile("rt+") as f:
|
16
17
|
f.write(filtered)
|
@@ -25,8 +26,9 @@ def test_filter_by_chains():
|
|
25
26
|
with open("tests/1a9n.cif") as f:
|
26
27
|
content = f.read()
|
27
28
|
|
28
|
-
filtered = filter_by_chains(content, ["A", "C"])
|
29
|
-
assert re.search(r"^_entity
|
29
|
+
filtered = filter_by_chains(content, ["A", "C"], ["chem_comp"])
|
30
|
+
assert re.search(r"^_entity\.id", filtered, re.MULTILINE) is not None
|
31
|
+
assert re.search(r"^_chem_comp\.id", filtered, re.MULTILINE) is not None
|
30
32
|
|
31
33
|
with tempfile.NamedTemporaryFile("rt+") as f:
|
32
34
|
f.write(filtered)
|
@@ -1,3 +1,5 @@
|
|
1
|
+
import gzip
|
2
|
+
|
1
3
|
from rnapolis.parser import read_3d_structure
|
2
4
|
|
3
5
|
|
@@ -31,3 +33,20 @@ def test_4qln_no_duplicate_atoms():
|
|
31
33
|
assert len(atom_names) == len(
|
32
34
|
set(atom_names)
|
33
35
|
), f"Duplicate atoms found in residue {residue.auth}"
|
36
|
+
|
37
|
+
|
38
|
+
def test_1gid():
|
39
|
+
expected_sequence = "GAAUUGCGGGAAAGGGGUCAACAGCCGUUCAGUACCAAGUCUCAGGGGAAACUUUGAGAUGGCCUUGCAAAGGGUAUGGUAAUAAGCUGACGGACAUGGUCCUAACCACGCAGCCAAGUCCUAAGUCAACAGAUCUUCUGUUGAUAUGGAUGCAGUUC"
|
40
|
+
|
41
|
+
with gzip.open("tests/1gid.cif.gz", "rt") as f:
|
42
|
+
structure3d = read_3d_structure(f, nucleic_acid_only=True)
|
43
|
+
|
44
|
+
residues_a = [r for r in structure3d.residues if r.auth.chain == "A"]
|
45
|
+
residues_b = [r for r in structure3d.residues if r.auth.chain == "B"]
|
46
|
+
assert len(residues_a) == len(expected_sequence)
|
47
|
+
assert len(residues_b) == len(expected_sequence)
|
48
|
+
|
49
|
+
actual_sequence_a = "".join([residue.one_letter_name for residue in residues_a])
|
50
|
+
actual_sequence_b = "".join([residue.one_letter_name for residue in residues_b])
|
51
|
+
assert actual_sequence_a == expected_sequence
|
52
|
+
assert actual_sequence_b == expected_sequence
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|