@datagrok/bio 2.4.31 → 2.4.40
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.eslintrc.json +6 -8
- package/README.md +22 -7
- package/css/msa.css +3 -0
- package/detectors.js +21 -12
- package/dist/1.js +2 -0
- package/dist/1.js.map +1 -0
- package/dist/18.js +2 -0
- package/dist/18.js.map +1 -0
- package/dist/190.js +2 -0
- package/dist/190.js.map +1 -0
- package/dist/452.js +2 -0
- package/dist/452.js.map +1 -0
- package/dist/729.js +2 -0
- package/dist/729.js.map +1 -0
- package/dist/package-test.js +1 -1
- package/dist/package-test.js.map +1 -1
- package/dist/package.js +1 -1
- package/dist/package.js.map +1 -1
- package/files/libraries/broken-lib.sdf +136 -0
- package/files/libraries/group1/mock-lib-3.json +74 -0
- package/files/libraries/mock-lib-2.json +48 -0
- package/files/tests/100_3_clustests.csv +100 -0
- package/files/tests/100_3_clustests_empty_vals.csv +100 -0
- package/files/tests/peptides_motif-with-random_10000.csv +9998 -0
- package/package.json +4 -4
- package/scripts/sequence_generator.py +164 -48
- package/src/analysis/sequence-activity-cliffs.ts +7 -9
- package/src/analysis/sequence-diversity-viewer.ts +8 -3
- package/src/analysis/sequence-search-base-viewer.ts +4 -3
- package/src/analysis/sequence-similarity-viewer.ts +13 -7
- package/src/analysis/sequence-space.ts +15 -12
- package/src/analysis/workers/mm-distance-array-service.ts +48 -0
- package/src/analysis/workers/mm-distance-array-worker.ts +29 -0
- package/src/analysis/workers/mm-distance-worker-creator.ts +6 -9
- package/src/apps/web-logo-app.ts +34 -0
- package/src/calculations/monomerLevelMols.ts +10 -12
- package/src/demo/bio01-similarity-diversity.ts +4 -5
- package/src/demo/bio01a-hierarchical-clustering-and-sequence-space.ts +6 -7
- package/src/demo/bio01b-hierarchical-clustering-and-activity-cliffs.ts +7 -8
- package/src/demo/bio03-atomic-level.ts +1 -4
- package/src/demo/bio05-helm-msa-sequence-space.ts +6 -4
- package/src/demo/utils.ts +3 -4
- package/src/package-test.ts +1 -2
- package/src/package.ts +135 -82
- package/src/seq_align.ts +482 -483
- package/src/substructure-search/substructure-search.ts +3 -3
- package/src/tests/Palettes-test.ts +1 -1
- package/src/tests/WebLogo-positions-test.ts +12 -35
- package/src/tests/_first-tests.ts +1 -1
- package/src/tests/activity-cliffs-tests.ts +10 -7
- package/src/tests/activity-cliffs-utils.ts +6 -5
- package/src/tests/bio-tests.ts +20 -25
- package/src/tests/checkInputColumn-tests.ts +5 -11
- package/src/tests/converters-test.ts +19 -37
- package/src/tests/detectors-benchmark-tests.ts +35 -37
- package/src/tests/detectors-tests.ts +29 -34
- package/src/tests/detectors-weak-and-likely-tests.ts +11 -21
- package/src/tests/fasta-export-tests.ts +3 -3
- package/src/tests/fasta-handler-test.ts +2 -3
- package/src/tests/lib-tests.ts +2 -4
- package/src/tests/mm-distance-tests.ts +25 -17
- package/src/tests/monomer-libraries-tests.ts +1 -1
- package/src/tests/msa-tests.ts +12 -9
- package/src/tests/pepsea-tests.ts +6 -3
- package/src/tests/renderers-test.ts +13 -11
- package/src/tests/sequence-space-test.ts +10 -8
- package/src/tests/sequence-space-utils.ts +6 -4
- package/src/tests/similarity-diversity-tests.ts +47 -61
- package/src/tests/splitters-test.ts +14 -20
- package/src/tests/to-atomic-level-tests.ts +9 -17
- package/src/tests/units-handler-splitted-tests.ts +106 -0
- package/src/tests/units-handler-tests.ts +22 -26
- package/src/tests/utils/sequences-generators.ts +6 -2
- package/src/tests/utils.ts +10 -4
- package/src/tests/viewers.ts +1 -1
- package/src/utils/atomic-works.ts +49 -57
- package/src/utils/cell-renderer.ts +25 -8
- package/src/utils/check-input-column.ts +19 -4
- package/src/utils/constants.ts +3 -3
- package/src/utils/convert.ts +56 -23
- package/src/utils/monomer-lib.ts +83 -64
- package/src/utils/multiple-sequence-alignment-ui.ts +35 -21
- package/src/utils/multiple-sequence-alignment.ts +2 -2
- package/src/utils/pepsea.ts +17 -7
- package/src/utils/save-as-fasta.ts +11 -4
- package/src/utils/ui-utils.ts +1 -1
- package/src/viewers/vd-regions-viewer.ts +21 -22
- package/src/viewers/web-logo-viewer.ts +189 -154
- package/src/widgets/bio-substructure-filter.ts +9 -6
- package/src/widgets/representations.ts +11 -12
- package/tsconfig.json +1 -1
- package/dist/258.js +0 -2
- package/dist/258.js.map +0 -1
- package/dist/457.js +0 -2
- package/dist/457.js.map +0 -1
- package/dist/562.js +0 -2
- package/dist/562.js.map +0 -1
- package/dist/925.js +0 -2
- package/dist/925.js.map +0 -1
- package/src/analysis/workers/mm-distance-worker.ts +0 -16
|
@@ -0,0 +1,136 @@
|
|
|
1
|
+
HELM Core Monomer library
|
|
2
|
+
RDKit 2D
|
|
3
|
+
|
|
4
|
+
7 6 0 0 1 0 0 0 0 0999 V2000
|
|
5
|
+
2.0625 0.7145 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
|
6
|
+
1.2375 0.7145 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
|
7
|
+
0.8250 1.4289 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
|
8
|
+
1.2375 2.1434 0.0000 R# 0 0 0 0 0 0 0 0 0 0 0 0
|
|
9
|
+
0.8250 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
|
10
|
+
1.2375 -0.7145 0.0000 R# 0 0 0 0 0 0 0 0 0 0 0 0
|
|
11
|
+
0.0000 0.0000 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
|
12
|
+
2 1 1 1
|
|
13
|
+
2 3 1 0
|
|
14
|
+
3 4 1 0
|
|
15
|
+
2 5 1 0
|
|
16
|
+
5 6 1 0
|
|
17
|
+
5 7 2 0
|
|
18
|
+
M RGP 2 4 1 6 2
|
|
19
|
+
M END
|
|
20
|
+
|
|
21
|
+
> <monomerType>
|
|
22
|
+
Backbone
|
|
23
|
+
|
|
24
|
+
> <author>
|
|
25
|
+
Pistoia Alliance HELM project
|
|
26
|
+
|
|
27
|
+
> <naturalAnalog>
|
|
28
|
+
A
|
|
29
|
+
|
|
30
|
+
> <createDate>
|
|
31
|
+
|
|
32
|
+
|
|
33
|
+
> <id>
|
|
34
|
+
0
|
|
35
|
+
|
|
36
|
+
> <polymerType>
|
|
37
|
+
PEPTIDE
|
|
38
|
+
|
|
39
|
+
> <symbol>
|
|
40
|
+
A
|
|
41
|
+
|
|
42
|
+
$$$$
|
|
43
|
+
HELM Core Monomer library
|
|
44
|
+
Ketcher 10131612512D 1 1.00000 0.00000 0
|
|
45
|
+
|
|
46
|
+
11 12 0 0 0 999 V2000
|
|
47
|
+
0.9632 -3.5449 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
|
48
|
+
0.0970 -4.0450 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
|
49
|
+
0.0970 -5.0451 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
|
50
|
+
0.9630 -5.5451 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
|
51
|
+
1.8291 -5.0452 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
|
52
|
+
1.8293 -4.0451 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
|
53
|
+
-0.8536 -5.3539 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
|
54
|
+
-1.4413 -4.5449 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
|
55
|
+
-0.8535 -3.7357 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
|
56
|
+
0.9632 -2.5448 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
|
57
|
+
-1.1626 -6.3051 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
|
58
|
+
1 10 1 0 0 0
|
|
59
|
+
1 6 2 0 0 0
|
|
60
|
+
1 2 1 0 0 0
|
|
61
|
+
9 2 1 0 0 0
|
|
62
|
+
2 3 2 0 0 0
|
|
63
|
+
7 3 1 0 0 0
|
|
64
|
+
3 4 1 0 0 0
|
|
65
|
+
4 5 2 0 0 0
|
|
66
|
+
5 6 1 0 0 0
|
|
67
|
+
7 8 1 0 0 0
|
|
68
|
+
7 11 1 0 0 0
|
|
69
|
+
8 9 2 0 0 0
|
|
70
|
+
A 11
|
|
71
|
+
R1
|
|
72
|
+
M END
|
|
73
|
+
|
|
74
|
+
> <monomerType>
|
|
75
|
+
Branch
|
|
76
|
+
|
|
77
|
+
> <author>
|
|
78
|
+
Pistoia Alliance HELM project
|
|
79
|
+
|
|
80
|
+
> <naturalAnalog>
|
|
81
|
+
A
|
|
82
|
+
|
|
83
|
+
> <createDate>
|
|
84
|
+
|
|
85
|
+
|
|
86
|
+
> <id>
|
|
87
|
+
0
|
|
88
|
+
|
|
89
|
+
> <polymerType>
|
|
90
|
+
RNA
|
|
91
|
+
|
|
92
|
+
> <symbol>
|
|
93
|
+
A
|
|
94
|
+
|
|
95
|
+
$$$$
|
|
96
|
+
HELM Core Monomer library
|
|
97
|
+
Ketcher 10061618102D 1 1.00000 0.00000 0
|
|
98
|
+
|
|
99
|
+
5 4 0 0 0 999 V2000
|
|
100
|
+
15.7527 -12.0837 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
|
101
|
+
15.7527 -13.0837 0.0000 P 0 0 0 0 0 0 0 0 0 0 0 0
|
|
102
|
+
16.6188 -13.5837 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
|
103
|
+
15.2527 -13.9496 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
|
104
|
+
14.7868 -12.8248 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
|
105
|
+
1 2 1 0 0 0
|
|
106
|
+
2 3 1 0 0 0
|
|
107
|
+
2 4 2 0 0 0
|
|
108
|
+
2 5 1 0 0 0
|
|
109
|
+
A 1
|
|
110
|
+
R1
|
|
111
|
+
A 3
|
|
112
|
+
R2
|
|
113
|
+
M END
|
|
114
|
+
|
|
115
|
+
> <monomerType>
|
|
116
|
+
Backbone
|
|
117
|
+
|
|
118
|
+
> <author>
|
|
119
|
+
Pistoia Alliance HELM project
|
|
120
|
+
|
|
121
|
+
> <naturalAnalog>
|
|
122
|
+
p
|
|
123
|
+
|
|
124
|
+
> <createDate>
|
|
125
|
+
|
|
126
|
+
|
|
127
|
+
> <id>
|
|
128
|
+
0
|
|
129
|
+
|
|
130
|
+
> <polymerType>
|
|
131
|
+
RNA
|
|
132
|
+
|
|
133
|
+
> <symbol>
|
|
134
|
+
p
|
|
135
|
+
|
|
136
|
+
$$$$
|
|
@@ -0,0 +1,74 @@
|
|
|
1
|
+
[
|
|
2
|
+
{
|
|
3
|
+
"monomerType": "Backbone",
|
|
4
|
+
"smiles": "C[C@H](N[H:1])C([OH:2])=O",
|
|
5
|
+
"name": "Alanine",
|
|
6
|
+
"author": "Pistoia Alliance HELM project",
|
|
7
|
+
"molfile": "HELM Core Monomer library\n RDKit 2D\n\n 7 6 0 0 1 0 0 0 0 0999 V2000\n 2.0625 0.7145 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 1.2375 0.7145 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 0.8250 1.4289 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0\n 1.2375 2.1434 0.0000 R# 0 0 0 0 0 0 0 0 0 0 0 0\n 0.8250 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 1.2375 -0.7145 0.0000 R# 0 0 0 0 0 0 0 0 0 0 0 0\n 0.0000 0.0000 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0\n 2 1 1 1\n 2 3 1 0\n 3 4 1 0\n 2 5 1 0\n 5 6 1 0\n 5 7 2 0\nM RGP 2 4 1 6 2\nM END\n",
|
|
8
|
+
"naturalAnalog": "A",
|
|
9
|
+
"rgroups": [
|
|
10
|
+
{
|
|
11
|
+
"capGroupSmiles": "[*:1][H]",
|
|
12
|
+
"alternateId": "R1-H",
|
|
13
|
+
"capGroupName": "H",
|
|
14
|
+
"label": "R1"
|
|
15
|
+
},
|
|
16
|
+
{
|
|
17
|
+
"capGroupSmiles": "O[*:2]",
|
|
18
|
+
"alternateId": "R2-OH",
|
|
19
|
+
"capGroupName": "OH",
|
|
20
|
+
"label": "R2"
|
|
21
|
+
}
|
|
22
|
+
],
|
|
23
|
+
"createDate": null,
|
|
24
|
+
"id": 0,
|
|
25
|
+
"polymerType": "PEPTIDE",
|
|
26
|
+
"symbol": "A"
|
|
27
|
+
},
|
|
28
|
+
{
|
|
29
|
+
"monomerType": "Branch",
|
|
30
|
+
"smiles": "[H:1]n1cnc2c(N)ncnc21",
|
|
31
|
+
"name": "Adenine",
|
|
32
|
+
"author": "Pistoia Alliance HELM project",
|
|
33
|
+
"molfile": "HELM Core Monomer library\n Ketcher 10131612512D 1 1.00000 0.00000 0\n\n 11 12 0 0 0 999 V2000\n 0.9632 -3.5449 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 0.0970 -4.0450 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 0.0970 -5.0451 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 0.9630 -5.5451 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0\n 1.8291 -5.0452 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 1.8293 -4.0451 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0\n -0.8536 -5.3539 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0\n -1.4413 -4.5449 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n -0.8535 -3.7357 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0\n 0.9632 -2.5448 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0\n -1.1626 -6.3051 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 1 10 1 0 0 0\n 1 6 2 0 0 0\n 1 2 1 0 0 0\n 9 2 1 0 0 0\n 2 3 2 0 0 0\n 7 3 1 0 0 0\n 3 4 1 0 0 0\n 4 5 2 0 0 0\n 5 6 1 0 0 0\n 7 8 1 0 0 0\n 7 11 1 0 0 0\n 8 9 2 0 0 0\nA 11\nR1\nM END\n",
|
|
34
|
+
"naturalAnalog": "A",
|
|
35
|
+
"rgroups": [
|
|
36
|
+
{
|
|
37
|
+
"capGroupSMILES": "[*:1][H]",
|
|
38
|
+
"alternateId": "R1-H",
|
|
39
|
+
"capGroupName": "H",
|
|
40
|
+
"label": "R1"
|
|
41
|
+
}
|
|
42
|
+
],
|
|
43
|
+
"symbol": "A",
|
|
44
|
+
"createDate": null,
|
|
45
|
+
"polymerType": "RNA",
|
|
46
|
+
"id": 0
|
|
47
|
+
},
|
|
48
|
+
{
|
|
49
|
+
"monomerType": "Backbone",
|
|
50
|
+
"smiles": "[OH:1]P([OH:2])(=O)O",
|
|
51
|
+
"name": "Phosphate",
|
|
52
|
+
"author": "Pistoia Alliance HELM project",
|
|
53
|
+
"molfile": "HELM Core Monomer library\n Ketcher 10061618102D 1 1.00000 0.00000 0\n\n 5 4 0 0 0 999 V2000\n 15.7527 -12.0837 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 15.7527 -13.0837 0.0000 P 0 0 0 0 0 0 0 0 0 0 0 0\n 16.6188 -13.5837 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 15.2527 -13.9496 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0\n 14.7868 -12.8248 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0\n 1 2 1 0 0 0\n 2 3 1 0 0 0\n 2 4 2 0 0 0\n 2 5 1 0 0 0\nA 1\nR1\nA 3\nR2\nM END\n",
|
|
54
|
+
"naturalAnalog": "p",
|
|
55
|
+
"rgroups": [
|
|
56
|
+
{
|
|
57
|
+
"capGroupSMILES": "O[*:1]",
|
|
58
|
+
"alternateId": "R1-OH",
|
|
59
|
+
"capGroupName": "OH",
|
|
60
|
+
"label": "R1"
|
|
61
|
+
},
|
|
62
|
+
{
|
|
63
|
+
"capGroupSMILES": "O[*:2]",
|
|
64
|
+
"alternateId": "R2-OH",
|
|
65
|
+
"capGroupName": "OH",
|
|
66
|
+
"label": "R2"
|
|
67
|
+
}
|
|
68
|
+
],
|
|
69
|
+
"symbol": "p",
|
|
70
|
+
"createDate": null,
|
|
71
|
+
"polymerType": "RNA",
|
|
72
|
+
"id": 0
|
|
73
|
+
}
|
|
74
|
+
]
|
|
@@ -0,0 +1,48 @@
|
|
|
1
|
+
[
|
|
2
|
+
{
|
|
3
|
+
"monomerType": "Backbone",
|
|
4
|
+
"smiles": "C[C@H](N[H:1])C([OH:2])=O",
|
|
5
|
+
"name": "Alanine",
|
|
6
|
+
"author": "Pistoia Alliance HELM project",
|
|
7
|
+
"molfile": "HELM Core Monomer library\n RDKit 2D\n\n 7 6 0 0 1 0 0 0 0 0999 V2000\n 2.0625 0.7145 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 1.2375 0.7145 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 0.8250 1.4289 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0\n 1.2375 2.1434 0.0000 R# 0 0 0 0 0 0 0 0 0 0 0 0\n 0.8250 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 1.2375 -0.7145 0.0000 R# 0 0 0 0 0 0 0 0 0 0 0 0\n 0.0000 0.0000 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0\n 2 1 1 1\n 2 3 1 0\n 3 4 1 0\n 2 5 1 0\n 5 6 1 0\n 5 7 2 0\nM RGP 2 4 1 6 2\nM END\n",
|
|
8
|
+
"naturalAnalog": "A",
|
|
9
|
+
"rgroups": [
|
|
10
|
+
{
|
|
11
|
+
"capGroupSmiles": "[*:1][H]",
|
|
12
|
+
"alternateId": "R1-H",
|
|
13
|
+
"capGroupName": "H",
|
|
14
|
+
"label": "R1"
|
|
15
|
+
},
|
|
16
|
+
{
|
|
17
|
+
"capGroupSmiles": "O[*:2]",
|
|
18
|
+
"alternateId": "R2-OH",
|
|
19
|
+
"capGroupName": "OH",
|
|
20
|
+
"label": "R2"
|
|
21
|
+
}
|
|
22
|
+
],
|
|
23
|
+
"createDate": null,
|
|
24
|
+
"id": 0,
|
|
25
|
+
"polymerType": "PEPTIDE",
|
|
26
|
+
"symbol": "A"
|
|
27
|
+
},
|
|
28
|
+
{
|
|
29
|
+
"monomerType": "Branch",
|
|
30
|
+
"smiles": "[H:1]n1cnc2c(N)ncnc21",
|
|
31
|
+
"name": "Adenine",
|
|
32
|
+
"author": "Pistoia Alliance HELM project",
|
|
33
|
+
"molfile": "HELM Core Monomer library\n Ketcher 10131612512D 1 1.00000 0.00000 0\n\n 11 12 0 0 0 999 V2000\n 0.9632 -3.5449 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 0.0970 -4.0450 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 0.0970 -5.0451 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 0.9630 -5.5451 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0\n 1.8291 -5.0452 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 1.8293 -4.0451 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0\n -0.8536 -5.3539 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0\n -1.4413 -4.5449 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n -0.8535 -3.7357 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0\n 0.9632 -2.5448 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0\n -1.1626 -6.3051 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 1 10 1 0 0 0\n 1 6 2 0 0 0\n 1 2 1 0 0 0\n 9 2 1 0 0 0\n 2 3 2 0 0 0\n 7 3 1 0 0 0\n 3 4 1 0 0 0\n 4 5 2 0 0 0\n 5 6 1 0 0 0\n 7 8 1 0 0 0\n 7 11 1 0 0 0\n 8 9 2 0 0 0\nA 11\nR1\nM END\n",
|
|
34
|
+
"naturalAnalog": "A",
|
|
35
|
+
"rgroups": [
|
|
36
|
+
{
|
|
37
|
+
"capGroupSMILES": "[*:1][H]",
|
|
38
|
+
"alternateId": "R1-H",
|
|
39
|
+
"capGroupName": "H",
|
|
40
|
+
"label": "R1"
|
|
41
|
+
}
|
|
42
|
+
],
|
|
43
|
+
"symbol": "A",
|
|
44
|
+
"createDate": null,
|
|
45
|
+
"polymerType": "RNA",
|
|
46
|
+
"id": 0
|
|
47
|
+
}
|
|
48
|
+
]
|
|
@@ -0,0 +1,100 @@
|
|
|
1
|
+
cluster,sequence_id,sequence,activity,is_cliff
|
|
2
|
+
0,c0_seq89,KSKMMIFNTAENMYIM, 3.51,False
|
|
3
|
+
0,c0_seq90,NLTMMHQQTAEALAMM, 3.00,False
|
|
4
|
+
0,c0_seq91,RWTGMIQQTAVAMYPC, 2.84,False
|
|
5
|
+
0,c0_seq92,YIRMMIQCTAVAMANE, 2.80,False
|
|
6
|
+
0,c0_seq93,CKKGMIQCTAGNLYAK, 3.30,False
|
|
7
|
+
0,c0_seq94,DHRMMIFQTAGNLYSQ, 3.68,False
|
|
8
|
+
0,c0_seq95,DLKMMHQNTPGNMAQD, 4.93,True
|
|
9
|
+
0,c0_seq96,DLKMMHQNTAGNMAQD, 1.19,True
|
|
10
|
+
0,c0_seq97,KLKMMHFQTAGNLAQH, 3.26,False
|
|
11
|
+
0,c0_seq98,WIRMMHFCTAGAMAGH, 2.70,False
|
|
12
|
+
0,c0_seq99,TNTMMHQCTAVALAQR, 2.16,False
|
|
13
|
+
0,c0_seq100,VHTMMIFQTAEALYKY, 2.58,False
|
|
14
|
+
0,c0_seq101,FGTGMIFNTAGNMYMT, 3.28,False
|
|
15
|
+
0,c0_seq102,MVKGMHQQTAENMYDV, 3.41,False
|
|
16
|
+
0,c0_seq103,RMTGMIQCTAGALAKC, 2.49,False
|
|
17
|
+
0,c0_seq104,KMRMMHFNTAENMYLD, 3.43,False
|
|
18
|
+
0,c0_seq105,CRTMMIQNTAENLYFM, 3.06,False
|
|
19
|
+
0,c0_seq106,KSTGMIQCTAGAMYGT, 2.68,False
|
|
20
|
+
0,c0_seq107,VFTMMHFNTAEAMYHG, 2.92,False
|
|
21
|
+
0,c0_seq108,YPRMMIQCTAGNLAEE, 2.99,False
|
|
22
|
+
0,c0_seq109,LETMMHQQTAGNMYTN, 3.56,False
|
|
23
|
+
0,c0_seq110,SDKGMIFNTAENMYHS, 3.67,False
|
|
24
|
+
0,c0_seq111,SSRMMHQNTAVALAHR, 2.93,False
|
|
25
|
+
0,c0_seq112,QATGMIFNTAEAMYSV, 3.34,False
|
|
26
|
+
0,c0_seq113,AQTGMHFNTAENMYFC, 2.56,False
|
|
27
|
+
0,c0_seq114,TDRGMHQCTAVAMALG, 3.47,False
|
|
28
|
+
0,c0_seq115,WDTGMIFCTAGALYQI, 3.09,False
|
|
29
|
+
0,c0_seq116,HLKMMIFQTAVNLYDG, 2.86,False
|
|
30
|
+
0,c0_seq117,NNRGMIFNTAENLAGR, 2.67,False
|
|
31
|
+
0,c0_seq118,CFRGMHQQTAENMALH, 2.86,False
|
|
32
|
+
0,c0_seq119,PSKGMHQQTAVNMALD, 2.44,False
|
|
33
|
+
0,c0_seq120,CGKMMIQNTAVALYSS, 2.85,False
|
|
34
|
+
0,c0_seq121,WKRGMIQQTAVNLYVR, 3.70,False
|
|
35
|
+
0,c0_seq122,AWRGMHFNTAEALACL, 3.10,False
|
|
36
|
+
1,c1_seq639,PDNEWTKKNNWLATWK, 4.43,False
|
|
37
|
+
1,c1_seq640,NCNEMTSWRNILAASQ, 4.41,False
|
|
38
|
+
1,c1_seq641,QMNEWTSKNNTLATWE, 4.43,False
|
|
39
|
+
1,c1_seq642,LRNEWTSKNCILGTYN, 4.42,False
|
|
40
|
+
1,c1_seq643,ALNEWTSKRNNLGAWW, 4.41,False
|
|
41
|
+
1,c1_seq644,PANEMTKWRNKLATKC, 4.44,False
|
|
42
|
+
1,c1_seq645,CNNEWTKWRDLLAADF, 4.44,False
|
|
43
|
+
1,c1_seq646,QTNEMTKKRCTLVWFE, 4.49,True
|
|
44
|
+
1,c1_seq647,QTNEMTKKRCTLAWFE, 4.37,True
|
|
45
|
+
1,c1_seq648,VVNEMTKKNDRLGADL, 4.43,False
|
|
46
|
+
1,c1_seq649,PPNEMTSKRDYLGAEW, 4.41,False
|
|
47
|
+
1,c1_seq650,EQNEMTSKNNGLGTHD, 4.43,False
|
|
48
|
+
1,c1_seq651,WCNEWTSWNCILGANT, 4.43,False
|
|
49
|
+
1,c1_seq652,TWNEMTKKNDDLAAYQ, 4.43,False
|
|
50
|
+
1,c1_seq653,QQNEWTSKRDILGWSG, 4.43,False
|
|
51
|
+
1,c1_seq654,TFNEMTSWRNCLGAWI, 4.45,False
|
|
52
|
+
1,c1_seq655,CRNEWTSKRNNLGWYH, 4.42,False
|
|
53
|
+
1,c1_seq656,VLNEMTKWRNVLGTPN, 4.43,False
|
|
54
|
+
1,c1_seq657,IMNEWTKWNNMLGTEK, 4.43,False
|
|
55
|
+
1,c1_seq658,DFNEWTKWNCYLGWWK, 4.44,False
|
|
56
|
+
1,c1_seq659,HKNEMTKWNNMLGAEY, 4.44,False
|
|
57
|
+
1,c1_seq660,RRNEWTSKRDALGWVT, 4.42,False
|
|
58
|
+
1,c1_seq661,RENEWTKKRNYLAWQT, 4.42,False
|
|
59
|
+
1,c1_seq662,RHNEMTKWRCDLGTKS, 4.43,False
|
|
60
|
+
1,c1_seq663,SLNEMTSKNNALGTDH, 4.43,False
|
|
61
|
+
1,c1_seq664,DFNEMTSWNNNLGWMY, 4.42,False
|
|
62
|
+
1,c1_seq665,MGNEWTKWRDQLATKW, 4.42,False
|
|
63
|
+
1,c1_seq666,ELNEMTKWRNFLATEK, 4.41,False
|
|
64
|
+
1,c1_seq667,MQNEMTKWNNELAWQP, 4.45,False
|
|
65
|
+
1,c1_seq668,GRNEWTSKNCFLGTAG, 4.44,False
|
|
66
|
+
1,c1_seq669,FRNEWTSKRCHLGWEC, 4.40,False
|
|
67
|
+
2,c2_seq1022,WCEFRRFYICPQPVFH, 1.18,False
|
|
68
|
+
2,c2_seq1023,WWGFRGRYIDKEPVRS,-1.03,False
|
|
69
|
+
2,c2_seq1024,GKESDAIGGDRRPVNA, 1.24,False
|
|
70
|
+
2,c2_seq1025,MGYVYTEMGCLFPVQV, 0.69,False
|
|
71
|
+
2,c2_seq1026,QKYLDCLWMDYRPVNH, 3.84,True
|
|
72
|
+
2,c2_seq1027,QKYLDCLWGDYRPVNH,-2.81,True
|
|
73
|
+
2,c2_seq1028,MFELDLTNIDWYPVMM, 0.60,False
|
|
74
|
+
2,c2_seq1029,CSEYDASSICKCPVYV, 1.33,False
|
|
75
|
+
2,c2_seq1030,FHECRYSSGDSSPVAW,-0.33,False
|
|
76
|
+
2,c2_seq1031,QNEKRDLMGDLYPVCE, 0.63,False
|
|
77
|
+
2,c2_seq1032,VHEQRTKTGDDTPVAS, 0.41,False
|
|
78
|
+
2,c2_seq1033,FVEIYDRPGCCNPVAC,-0.92,False
|
|
79
|
+
2,c2_seq1034,KFEEYCLIICNRPVPD,-0.71,False
|
|
80
|
+
2,c2_seq1035,YSGARQELIDSEPVDD, 0.35,False
|
|
81
|
+
2,c2_seq1036,HLEWRLEHGDYWPVIA, 0.87,False
|
|
82
|
+
2,c2_seq1037,QFEWYAAPGDCGPVVW, 1.08,False
|
|
83
|
+
2,c2_seq1038,VMYSYPNRIDGCPVEV, 1.53,False
|
|
84
|
+
2,c2_seq1039,ECYYRQIDICATPVGV,-1.44,False
|
|
85
|
+
2,c2_seq1040,SLGAYCKNICFSPVYT,-0.81,False
|
|
86
|
+
2,c2_seq1041,SHECYVCWICMMPVYF,-0.18,False
|
|
87
|
+
2,c2_seq1042,EHGIYHPWICQDPVHI, 0.57,False
|
|
88
|
+
2,c2_seq1043,HVYAYSHEICTWPVQM, 0.16,False
|
|
89
|
+
2,c2_seq1044,VMYRDSFLGDKSPVNF, 1.70,False
|
|
90
|
+
2,c2_seq1045,ELGIYCPYGDMKPVVV, 0.79,False
|
|
91
|
+
2,c2_seq1046,RWESRRYKGCDRPVIV, 1.82,False
|
|
92
|
+
2,c2_seq1047,SSYTDSLSGDNHPVYQ, 0.47,False
|
|
93
|
+
2,c2_seq1048,LKYARSDCIDGIPVYH, 0.89,False
|
|
94
|
+
2,c2_seq1049,WDYYDKAHIDIGPVCQ, 0.65,False
|
|
95
|
+
2,c2_seq1050,NNYPRMCPICNFPVYI,-0.71,False
|
|
96
|
+
2,c2_seq1051,ADENDNHEGCNWPVNC,-0.06,False
|
|
97
|
+
2,c2_seq1052,NQYRREPRGCRSPVWK,-0.18,False
|
|
98
|
+
2,c2_seq1053,GMGWYQHFIDCMPVME, 0.39,False
|
|
99
|
+
2,c2_seq1054,HHEDYSSHGDRHPVAE, 0.34,False
|
|
100
|
+
2,c2_seq1055,WFYIRFWNGCMWPVDH, 0.63,False
|
|
@@ -0,0 +1,100 @@
|
|
|
1
|
+
cluster,sequence_id,sequence,activity,is_cliff
|
|
2
|
+
0,c0_seq89,KSKMMIFNTAENMYIM, 3.51,False
|
|
3
|
+
0,c0_seq90,NLTMMHQQTAEALAMM, 3.00,False
|
|
4
|
+
0,c0_seq91,RWTGMIQQTAVAMYPC, 2.84,False
|
|
5
|
+
0,c0_seq92,, 2.80,False
|
|
6
|
+
0,c0_seq93,CKKGMIQCTAGNLYAK, 3.30,False
|
|
7
|
+
0,c0_seq94,DHRMMIFQTAGNLYSQ, 3.68,False
|
|
8
|
+
0,c0_seq95,DLKMMHQNTPGNMAQD, 4.93,True
|
|
9
|
+
0,c0_seq96,DLKMMHQNTAGNMAQD, 1.19,True
|
|
10
|
+
0,c0_seq97,KLKMMHFQTAGNLAQH, 3.26,False
|
|
11
|
+
0,c0_seq98,WIRMMHFCTAGAMAGH, 2.70,False
|
|
12
|
+
0,c0_seq99,TNTMMHQCTAVALAQR, 2.16,False
|
|
13
|
+
0,c0_seq100,VHTMMIFQTAEALYKY, 2.58,False
|
|
14
|
+
0,c0_seq101,FGTGMIFNTAGNMYMT, 3.28,False
|
|
15
|
+
0,c0_seq102,MVKGMHQQTAENMYDV, 3.41,False
|
|
16
|
+
0,c0_seq103,RMTGMIQCTAGALAKC, 2.49,False
|
|
17
|
+
0,c0_seq104,KMRMMHFNTAENMYLD, 3.43,False
|
|
18
|
+
0,c0_seq105,CRTMMIQNTAENLYFM, 3.06,False
|
|
19
|
+
0,c0_seq106,KSTGMIQCTAGAMYGT, 2.68,False
|
|
20
|
+
0,c0_seq107,VFTMMHFNTAEAMYHG, 2.92,False
|
|
21
|
+
0,c0_seq108,YPRMMIQCTAGNLAEE, 2.99,False
|
|
22
|
+
0,c0_seq109,LETMMHQQTAGNMYTN, 3.56,False
|
|
23
|
+
0,c0_seq110,SDKGMIFNTAENMYHS, 3.67,False
|
|
24
|
+
0,c0_seq111,SSRMMHQNTAVALAHR, 2.93,False
|
|
25
|
+
0,c0_seq112,QATGMIFNTAEAMYSV, 3.34,False
|
|
26
|
+
0,c0_seq113,AQTGMHFNTAENMYFC, 2.56,False
|
|
27
|
+
0,c0_seq114,, 3.47,False
|
|
28
|
+
0,c0_seq115,WDTGMIFCTAGALYQI, 3.09,False
|
|
29
|
+
0,c0_seq116,HLKMMIFQTAVNLYDG, 2.86,False
|
|
30
|
+
0,c0_seq117,NNRGMIFNTAENLAGR, 2.67,False
|
|
31
|
+
0,c0_seq118,CFRGMHQQTAENMALH, 2.86,False
|
|
32
|
+
0,c0_seq119,PSKGMHQQTAVNMALD, 2.44,False
|
|
33
|
+
0,c0_seq120,CGKMMIQNTAVALYSS, 2.85,False
|
|
34
|
+
0,c0_seq121,WKRGMIQQTAVNLYVR, 3.70,False
|
|
35
|
+
0,c0_seq122,AWRGMHFNTAEALACL, 3.10,False
|
|
36
|
+
1,c1_seq639,PDNEWTKKNNWLATWK, 4.43,False
|
|
37
|
+
1,c1_seq640,NCNEMTSWRNILAASQ, 4.41,False
|
|
38
|
+
1,c1_seq641,QMNEWTSKNNTLATWE, 4.43,False
|
|
39
|
+
1,c1_seq642,LRNEWTSKNCILGTYN, 4.42,False
|
|
40
|
+
1,c1_seq643,ALNEWTSKRNNLGAWW, 4.41,False
|
|
41
|
+
1,c1_seq644,PANEMTKWRNKLATKC, 4.44,False
|
|
42
|
+
1,c1_seq645,CNNEWTKWRDLLAADF, 4.44,False
|
|
43
|
+
1,c1_seq646,QTNEMTKKRCTLVWFE, 4.49,True
|
|
44
|
+
1,c1_seq647,QTNEMTKKRCTLAWFE, 4.37,True
|
|
45
|
+
1,c1_seq648,VVNEMTKKNDRLGADL, 4.43,False
|
|
46
|
+
1,c1_seq649,PPNEMTSKRDYLGAEW, 4.41,False
|
|
47
|
+
1,c1_seq650,EQNEMTSKNNGLGTHD, 4.43,False
|
|
48
|
+
1,c1_seq651,WCNEWTSWNCILGANT, 4.43,False
|
|
49
|
+
1,c1_seq652,TWNEMTKKNDDLAAYQ, 4.43,False
|
|
50
|
+
1,c1_seq653,QQNEWTSKRDILGWSG, 4.43,False
|
|
51
|
+
1,c1_seq654,TFNEMTSWRNCLGAWI, 4.45,False
|
|
52
|
+
1,c1_seq655,CRNEWTSKRNNLGWYH, 4.42,False
|
|
53
|
+
1,c1_seq656,VLNEMTKWRNVLGTPN, 4.43,False
|
|
54
|
+
1,c1_seq657,IMNEWTKWNNMLGTEK, 4.43,False
|
|
55
|
+
1,c1_seq658,DFNEWTKWNCYLGWWK, 4.44,False
|
|
56
|
+
1,c1_seq659,HKNEMTKWNNMLGAEY, 4.44,False
|
|
57
|
+
1,c1_seq660,RRNEWTSKRDALGWVT, 4.42,False
|
|
58
|
+
1,c1_seq661,RENEWTKKRNYLAWQT, 4.42,False
|
|
59
|
+
1,c1_seq662,RHNEMTKWRCDLGTKS, 4.43,False
|
|
60
|
+
1,c1_seq663,SLNEMTSKNNALGTDH, 4.43,False
|
|
61
|
+
1,c1_seq664,DFNEMTSWNNNLGWMY, 4.42,False
|
|
62
|
+
1,c1_seq665,MGNEWTKWRDQLATKW, 4.42,False
|
|
63
|
+
1,c1_seq666,ELNEMTKWRNFLATEK, 4.41,False
|
|
64
|
+
1,c1_seq667,MQNEMTKWNNELAWQP, 4.45,False
|
|
65
|
+
1,c1_seq668,GRNEWTSKNCFLGTAG, 4.44,False
|
|
66
|
+
1,c1_seq669,FRNEWTSKRCHLGWEC, 4.40,False
|
|
67
|
+
2,c2_seq1022,WCEFRRFYICPQPVFH, 1.18,False
|
|
68
|
+
2,c2_seq1023,WWGFRGRYIDKEPVRS,-1.03,False
|
|
69
|
+
2,c2_seq1024,GKESDAIGGDRRPVNA, 1.24,False
|
|
70
|
+
2,c2_seq1025,MGYVYTEMGCLFPVQV, 0.69,False
|
|
71
|
+
2,c2_seq1026,QKYLDCLWMDYRPVNH, 3.84,True
|
|
72
|
+
2,c2_seq1027,QKYLDCLWGDYRPVNH,-2.81,True
|
|
73
|
+
2,c2_seq1028,MFELDLTNIDWYPVMM, 0.60,False
|
|
74
|
+
2,c2_seq1029,CSEYDASSICKCPVYV, 1.33,False
|
|
75
|
+
2,c2_seq1030,FHECRYSSGDSSPVAW,-0.33,False
|
|
76
|
+
2,c2_seq1031,QNEKRDLMGDLYPVCE, 0.63,False
|
|
77
|
+
2,c2_seq1032,VHEQRTKTGDDTPVAS, 0.41,False
|
|
78
|
+
2,c2_seq1033,FVEIYDRPGCCNPVAC,-0.92,False
|
|
79
|
+
2,c2_seq1034,KFEEYCLIICNRPVPD,-0.71,False
|
|
80
|
+
2,c2_seq1035,YSGARQELIDSEPVDD, 0.35,False
|
|
81
|
+
2,c2_seq1036,HLEWRLEHGDYWPVIA, 0.87,False
|
|
82
|
+
2,c2_seq1037,QFEWYAAPGDCGPVVW, 1.08,False
|
|
83
|
+
2,c2_seq1038,VMYSYPNRIDGCPVEV, 1.53,False
|
|
84
|
+
2,c2_seq1039,ECYYRQIDICATPVGV,-1.44,False
|
|
85
|
+
2,c2_seq1040,SLGAYCKNICFSPVYT,-0.81,False
|
|
86
|
+
2,c2_seq1041,SHECYVCWICMMPVYF,-0.18,False
|
|
87
|
+
2,c2_seq1042,EHGIYHPWICQDPVHI, 0.57,False
|
|
88
|
+
2,c2_seq1043,HVYAYSHEICTWPVQM, 0.16,False
|
|
89
|
+
2,c2_seq1044,VMYRDSFLGDKSPVNF, 1.70,False
|
|
90
|
+
2,c2_seq1045,ELGIYCPYGDMKPVVV, 0.79,False
|
|
91
|
+
2,c2_seq1046,RWESRRYKGCDRPVIV, 1.82,False
|
|
92
|
+
2,c2_seq1047,SSYTDSLSGDNHPVYQ, 0.47,False
|
|
93
|
+
2,c2_seq1048,LKYARSDCIDGIPVYH, 0.89,False
|
|
94
|
+
2,c2_seq1049,WDYYDKAHIDIGPVCQ, 0.65,False
|
|
95
|
+
2,c2_seq1050,NNYPRMCPICNFPVYI,-0.71,False
|
|
96
|
+
2,c2_seq1051,ADENDNHEGCNWPVNC,-0.06,False
|
|
97
|
+
2,c2_seq1052,NQYRREPRGCRSPVWK,-0.18,False
|
|
98
|
+
2,c2_seq1053,GMGWYQHFIDCMPVME, 0.39,False
|
|
99
|
+
2,c2_seq1054,HHEDYSSHGDRHPVAE, 0.34,False
|
|
100
|
+
2,c2_seq1055,WFYIRFWNGCMWPVDH, 0.63,False
|