@datagrok/bio 2.4.31 → 2.4.40

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (100) hide show
  1. package/.eslintrc.json +6 -8
  2. package/README.md +22 -7
  3. package/css/msa.css +3 -0
  4. package/detectors.js +21 -12
  5. package/dist/1.js +2 -0
  6. package/dist/1.js.map +1 -0
  7. package/dist/18.js +2 -0
  8. package/dist/18.js.map +1 -0
  9. package/dist/190.js +2 -0
  10. package/dist/190.js.map +1 -0
  11. package/dist/452.js +2 -0
  12. package/dist/452.js.map +1 -0
  13. package/dist/729.js +2 -0
  14. package/dist/729.js.map +1 -0
  15. package/dist/package-test.js +1 -1
  16. package/dist/package-test.js.map +1 -1
  17. package/dist/package.js +1 -1
  18. package/dist/package.js.map +1 -1
  19. package/files/libraries/broken-lib.sdf +136 -0
  20. package/files/libraries/group1/mock-lib-3.json +74 -0
  21. package/files/libraries/mock-lib-2.json +48 -0
  22. package/files/tests/100_3_clustests.csv +100 -0
  23. package/files/tests/100_3_clustests_empty_vals.csv +100 -0
  24. package/files/tests/peptides_motif-with-random_10000.csv +9998 -0
  25. package/package.json +4 -4
  26. package/scripts/sequence_generator.py +164 -48
  27. package/src/analysis/sequence-activity-cliffs.ts +7 -9
  28. package/src/analysis/sequence-diversity-viewer.ts +8 -3
  29. package/src/analysis/sequence-search-base-viewer.ts +4 -3
  30. package/src/analysis/sequence-similarity-viewer.ts +13 -7
  31. package/src/analysis/sequence-space.ts +15 -12
  32. package/src/analysis/workers/mm-distance-array-service.ts +48 -0
  33. package/src/analysis/workers/mm-distance-array-worker.ts +29 -0
  34. package/src/analysis/workers/mm-distance-worker-creator.ts +6 -9
  35. package/src/apps/web-logo-app.ts +34 -0
  36. package/src/calculations/monomerLevelMols.ts +10 -12
  37. package/src/demo/bio01-similarity-diversity.ts +4 -5
  38. package/src/demo/bio01a-hierarchical-clustering-and-sequence-space.ts +6 -7
  39. package/src/demo/bio01b-hierarchical-clustering-and-activity-cliffs.ts +7 -8
  40. package/src/demo/bio03-atomic-level.ts +1 -4
  41. package/src/demo/bio05-helm-msa-sequence-space.ts +6 -4
  42. package/src/demo/utils.ts +3 -4
  43. package/src/package-test.ts +1 -2
  44. package/src/package.ts +135 -82
  45. package/src/seq_align.ts +482 -483
  46. package/src/substructure-search/substructure-search.ts +3 -3
  47. package/src/tests/Palettes-test.ts +1 -1
  48. package/src/tests/WebLogo-positions-test.ts +12 -35
  49. package/src/tests/_first-tests.ts +1 -1
  50. package/src/tests/activity-cliffs-tests.ts +10 -7
  51. package/src/tests/activity-cliffs-utils.ts +6 -5
  52. package/src/tests/bio-tests.ts +20 -25
  53. package/src/tests/checkInputColumn-tests.ts +5 -11
  54. package/src/tests/converters-test.ts +19 -37
  55. package/src/tests/detectors-benchmark-tests.ts +35 -37
  56. package/src/tests/detectors-tests.ts +29 -34
  57. package/src/tests/detectors-weak-and-likely-tests.ts +11 -21
  58. package/src/tests/fasta-export-tests.ts +3 -3
  59. package/src/tests/fasta-handler-test.ts +2 -3
  60. package/src/tests/lib-tests.ts +2 -4
  61. package/src/tests/mm-distance-tests.ts +25 -17
  62. package/src/tests/monomer-libraries-tests.ts +1 -1
  63. package/src/tests/msa-tests.ts +12 -9
  64. package/src/tests/pepsea-tests.ts +6 -3
  65. package/src/tests/renderers-test.ts +13 -11
  66. package/src/tests/sequence-space-test.ts +10 -8
  67. package/src/tests/sequence-space-utils.ts +6 -4
  68. package/src/tests/similarity-diversity-tests.ts +47 -61
  69. package/src/tests/splitters-test.ts +14 -20
  70. package/src/tests/to-atomic-level-tests.ts +9 -17
  71. package/src/tests/units-handler-splitted-tests.ts +106 -0
  72. package/src/tests/units-handler-tests.ts +22 -26
  73. package/src/tests/utils/sequences-generators.ts +6 -2
  74. package/src/tests/utils.ts +10 -4
  75. package/src/tests/viewers.ts +1 -1
  76. package/src/utils/atomic-works.ts +49 -57
  77. package/src/utils/cell-renderer.ts +25 -8
  78. package/src/utils/check-input-column.ts +19 -4
  79. package/src/utils/constants.ts +3 -3
  80. package/src/utils/convert.ts +56 -23
  81. package/src/utils/monomer-lib.ts +83 -64
  82. package/src/utils/multiple-sequence-alignment-ui.ts +35 -21
  83. package/src/utils/multiple-sequence-alignment.ts +2 -2
  84. package/src/utils/pepsea.ts +17 -7
  85. package/src/utils/save-as-fasta.ts +11 -4
  86. package/src/utils/ui-utils.ts +1 -1
  87. package/src/viewers/vd-regions-viewer.ts +21 -22
  88. package/src/viewers/web-logo-viewer.ts +189 -154
  89. package/src/widgets/bio-substructure-filter.ts +9 -6
  90. package/src/widgets/representations.ts +11 -12
  91. package/tsconfig.json +1 -1
  92. package/dist/258.js +0 -2
  93. package/dist/258.js.map +0 -1
  94. package/dist/457.js +0 -2
  95. package/dist/457.js.map +0 -1
  96. package/dist/562.js +0 -2
  97. package/dist/562.js.map +0 -1
  98. package/dist/925.js +0 -2
  99. package/dist/925.js.map +0 -1
  100. package/src/analysis/workers/mm-distance-worker.ts +0 -16
@@ -0,0 +1,136 @@
1
+ HELM Core Monomer library
2
+ RDKit 2D
3
+
4
+ 7 6 0 0 1 0 0 0 0 0999 V2000
5
+ 2.0625 0.7145 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
6
+ 1.2375 0.7145 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
7
+ 0.8250 1.4289 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
8
+ 1.2375 2.1434 0.0000 R# 0 0 0 0 0 0 0 0 0 0 0 0
9
+ 0.8250 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
10
+ 1.2375 -0.7145 0.0000 R# 0 0 0 0 0 0 0 0 0 0 0 0
11
+ 0.0000 0.0000 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
12
+ 2 1 1 1
13
+ 2 3 1 0
14
+ 3 4 1 0
15
+ 2 5 1 0
16
+ 5 6 1 0
17
+ 5 7 2 0
18
+ M RGP 2 4 1 6 2
19
+ M END
20
+
21
+ > <monomerType>
22
+ Backbone
23
+
24
+ > <author>
25
+ Pistoia Alliance HELM project
26
+
27
+ > <naturalAnalog>
28
+ A
29
+
30
+ > <createDate>
31
+
32
+
33
+ > <id>
34
+ 0
35
+
36
+ > <polymerType>
37
+ PEPTIDE
38
+
39
+ > <symbol>
40
+ A
41
+
42
+ $$$$
43
+ HELM Core Monomer library
44
+ Ketcher 10131612512D 1 1.00000 0.00000 0
45
+
46
+ 11 12 0 0 0 999 V2000
47
+ 0.9632 -3.5449 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
48
+ 0.0970 -4.0450 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
49
+ 0.0970 -5.0451 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
50
+ 0.9630 -5.5451 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
51
+ 1.8291 -5.0452 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
52
+ 1.8293 -4.0451 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
53
+ -0.8536 -5.3539 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
54
+ -1.4413 -4.5449 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
55
+ -0.8535 -3.7357 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
56
+ 0.9632 -2.5448 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
57
+ -1.1626 -6.3051 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
58
+ 1 10 1 0 0 0
59
+ 1 6 2 0 0 0
60
+ 1 2 1 0 0 0
61
+ 9 2 1 0 0 0
62
+ 2 3 2 0 0 0
63
+ 7 3 1 0 0 0
64
+ 3 4 1 0 0 0
65
+ 4 5 2 0 0 0
66
+ 5 6 1 0 0 0
67
+ 7 8 1 0 0 0
68
+ 7 11 1 0 0 0
69
+ 8 9 2 0 0 0
70
+ A 11
71
+ R1
72
+ M END
73
+
74
+ > <monomerType>
75
+ Branch
76
+
77
+ > <author>
78
+ Pistoia Alliance HELM project
79
+
80
+ > <naturalAnalog>
81
+ A
82
+
83
+ > <createDate>
84
+
85
+
86
+ > <id>
87
+ 0
88
+
89
+ > <polymerType>
90
+ RNA
91
+
92
+ > <symbol>
93
+ A
94
+
95
+ $$$$
96
+ HELM Core Monomer library
97
+ Ketcher 10061618102D 1 1.00000 0.00000 0
98
+
99
+ 5 4 0 0 0 999 V2000
100
+ 15.7527 -12.0837 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
101
+ 15.7527 -13.0837 0.0000 P 0 0 0 0 0 0 0 0 0 0 0 0
102
+ 16.6188 -13.5837 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
103
+ 15.2527 -13.9496 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
104
+ 14.7868 -12.8248 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
105
+ 1 2 1 0 0 0
106
+ 2 3 1 0 0 0
107
+ 2 4 2 0 0 0
108
+ 2 5 1 0 0 0
109
+ A 1
110
+ R1
111
+ A 3
112
+ R2
113
+ M END
114
+
115
+ > <monomerType>
116
+ Backbone
117
+
118
+ > <author>
119
+ Pistoia Alliance HELM project
120
+
121
+ > <naturalAnalog>
122
+ p
123
+
124
+ > <createDate>
125
+
126
+
127
+ > <id>
128
+ 0
129
+
130
+ > <polymerType>
131
+ RNA
132
+
133
+ > <symbol>
134
+ p
135
+
136
+ $$$$
@@ -0,0 +1,74 @@
1
+ [
2
+ {
3
+ "monomerType": "Backbone",
4
+ "smiles": "C[C@H](N[H:1])C([OH:2])=O",
5
+ "name": "Alanine",
6
+ "author": "Pistoia Alliance HELM project",
7
+ "molfile": "HELM Core Monomer library\n RDKit 2D\n\n 7 6 0 0 1 0 0 0 0 0999 V2000\n 2.0625 0.7145 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 1.2375 0.7145 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 0.8250 1.4289 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0\n 1.2375 2.1434 0.0000 R# 0 0 0 0 0 0 0 0 0 0 0 0\n 0.8250 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 1.2375 -0.7145 0.0000 R# 0 0 0 0 0 0 0 0 0 0 0 0\n 0.0000 0.0000 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0\n 2 1 1 1\n 2 3 1 0\n 3 4 1 0\n 2 5 1 0\n 5 6 1 0\n 5 7 2 0\nM RGP 2 4 1 6 2\nM END\n",
8
+ "naturalAnalog": "A",
9
+ "rgroups": [
10
+ {
11
+ "capGroupSmiles": "[*:1][H]",
12
+ "alternateId": "R1-H",
13
+ "capGroupName": "H",
14
+ "label": "R1"
15
+ },
16
+ {
17
+ "capGroupSmiles": "O[*:2]",
18
+ "alternateId": "R2-OH",
19
+ "capGroupName": "OH",
20
+ "label": "R2"
21
+ }
22
+ ],
23
+ "createDate": null,
24
+ "id": 0,
25
+ "polymerType": "PEPTIDE",
26
+ "symbol": "A"
27
+ },
28
+ {
29
+ "monomerType": "Branch",
30
+ "smiles": "[H:1]n1cnc2c(N)ncnc21",
31
+ "name": "Adenine",
32
+ "author": "Pistoia Alliance HELM project",
33
+ "molfile": "HELM Core Monomer library\n Ketcher 10131612512D 1 1.00000 0.00000 0\n\n 11 12 0 0 0 999 V2000\n 0.9632 -3.5449 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 0.0970 -4.0450 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 0.0970 -5.0451 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 0.9630 -5.5451 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0\n 1.8291 -5.0452 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 1.8293 -4.0451 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0\n -0.8536 -5.3539 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0\n -1.4413 -4.5449 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n -0.8535 -3.7357 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0\n 0.9632 -2.5448 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0\n -1.1626 -6.3051 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 1 10 1 0 0 0\n 1 6 2 0 0 0\n 1 2 1 0 0 0\n 9 2 1 0 0 0\n 2 3 2 0 0 0\n 7 3 1 0 0 0\n 3 4 1 0 0 0\n 4 5 2 0 0 0\n 5 6 1 0 0 0\n 7 8 1 0 0 0\n 7 11 1 0 0 0\n 8 9 2 0 0 0\nA 11\nR1\nM END\n",
34
+ "naturalAnalog": "A",
35
+ "rgroups": [
36
+ {
37
+ "capGroupSMILES": "[*:1][H]",
38
+ "alternateId": "R1-H",
39
+ "capGroupName": "H",
40
+ "label": "R1"
41
+ }
42
+ ],
43
+ "symbol": "A",
44
+ "createDate": null,
45
+ "polymerType": "RNA",
46
+ "id": 0
47
+ },
48
+ {
49
+ "monomerType": "Backbone",
50
+ "smiles": "[OH:1]P([OH:2])(=O)O",
51
+ "name": "Phosphate",
52
+ "author": "Pistoia Alliance HELM project",
53
+ "molfile": "HELM Core Monomer library\n Ketcher 10061618102D 1 1.00000 0.00000 0\n\n 5 4 0 0 0 999 V2000\n 15.7527 -12.0837 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 15.7527 -13.0837 0.0000 P 0 0 0 0 0 0 0 0 0 0 0 0\n 16.6188 -13.5837 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 15.2527 -13.9496 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0\n 14.7868 -12.8248 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0\n 1 2 1 0 0 0\n 2 3 1 0 0 0\n 2 4 2 0 0 0\n 2 5 1 0 0 0\nA 1\nR1\nA 3\nR2\nM END\n",
54
+ "naturalAnalog": "p",
55
+ "rgroups": [
56
+ {
57
+ "capGroupSMILES": "O[*:1]",
58
+ "alternateId": "R1-OH",
59
+ "capGroupName": "OH",
60
+ "label": "R1"
61
+ },
62
+ {
63
+ "capGroupSMILES": "O[*:2]",
64
+ "alternateId": "R2-OH",
65
+ "capGroupName": "OH",
66
+ "label": "R2"
67
+ }
68
+ ],
69
+ "symbol": "p",
70
+ "createDate": null,
71
+ "polymerType": "RNA",
72
+ "id": 0
73
+ }
74
+ ]
@@ -0,0 +1,48 @@
1
+ [
2
+ {
3
+ "monomerType": "Backbone",
4
+ "smiles": "C[C@H](N[H:1])C([OH:2])=O",
5
+ "name": "Alanine",
6
+ "author": "Pistoia Alliance HELM project",
7
+ "molfile": "HELM Core Monomer library\n RDKit 2D\n\n 7 6 0 0 1 0 0 0 0 0999 V2000\n 2.0625 0.7145 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 1.2375 0.7145 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 0.8250 1.4289 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0\n 1.2375 2.1434 0.0000 R# 0 0 0 0 0 0 0 0 0 0 0 0\n 0.8250 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 1.2375 -0.7145 0.0000 R# 0 0 0 0 0 0 0 0 0 0 0 0\n 0.0000 0.0000 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0\n 2 1 1 1\n 2 3 1 0\n 3 4 1 0\n 2 5 1 0\n 5 6 1 0\n 5 7 2 0\nM RGP 2 4 1 6 2\nM END\n",
8
+ "naturalAnalog": "A",
9
+ "rgroups": [
10
+ {
11
+ "capGroupSmiles": "[*:1][H]",
12
+ "alternateId": "R1-H",
13
+ "capGroupName": "H",
14
+ "label": "R1"
15
+ },
16
+ {
17
+ "capGroupSmiles": "O[*:2]",
18
+ "alternateId": "R2-OH",
19
+ "capGroupName": "OH",
20
+ "label": "R2"
21
+ }
22
+ ],
23
+ "createDate": null,
24
+ "id": 0,
25
+ "polymerType": "PEPTIDE",
26
+ "symbol": "A"
27
+ },
28
+ {
29
+ "monomerType": "Branch",
30
+ "smiles": "[H:1]n1cnc2c(N)ncnc21",
31
+ "name": "Adenine",
32
+ "author": "Pistoia Alliance HELM project",
33
+ "molfile": "HELM Core Monomer library\n Ketcher 10131612512D 1 1.00000 0.00000 0\n\n 11 12 0 0 0 999 V2000\n 0.9632 -3.5449 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 0.0970 -4.0450 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 0.0970 -5.0451 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 0.9630 -5.5451 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0\n 1.8291 -5.0452 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 1.8293 -4.0451 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0\n -0.8536 -5.3539 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0\n -1.4413 -4.5449 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n -0.8535 -3.7357 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0\n 0.9632 -2.5448 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0\n -1.1626 -6.3051 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0\n 1 10 1 0 0 0\n 1 6 2 0 0 0\n 1 2 1 0 0 0\n 9 2 1 0 0 0\n 2 3 2 0 0 0\n 7 3 1 0 0 0\n 3 4 1 0 0 0\n 4 5 2 0 0 0\n 5 6 1 0 0 0\n 7 8 1 0 0 0\n 7 11 1 0 0 0\n 8 9 2 0 0 0\nA 11\nR1\nM END\n",
34
+ "naturalAnalog": "A",
35
+ "rgroups": [
36
+ {
37
+ "capGroupSMILES": "[*:1][H]",
38
+ "alternateId": "R1-H",
39
+ "capGroupName": "H",
40
+ "label": "R1"
41
+ }
42
+ ],
43
+ "symbol": "A",
44
+ "createDate": null,
45
+ "polymerType": "RNA",
46
+ "id": 0
47
+ }
48
+ ]
@@ -0,0 +1,100 @@
1
+ cluster,sequence_id,sequence,activity,is_cliff
2
+ 0,c0_seq89,KSKMMIFNTAENMYIM, 3.51,False
3
+ 0,c0_seq90,NLTMMHQQTAEALAMM, 3.00,False
4
+ 0,c0_seq91,RWTGMIQQTAVAMYPC, 2.84,False
5
+ 0,c0_seq92,YIRMMIQCTAVAMANE, 2.80,False
6
+ 0,c0_seq93,CKKGMIQCTAGNLYAK, 3.30,False
7
+ 0,c0_seq94,DHRMMIFQTAGNLYSQ, 3.68,False
8
+ 0,c0_seq95,DLKMMHQNTPGNMAQD, 4.93,True
9
+ 0,c0_seq96,DLKMMHQNTAGNMAQD, 1.19,True
10
+ 0,c0_seq97,KLKMMHFQTAGNLAQH, 3.26,False
11
+ 0,c0_seq98,WIRMMHFCTAGAMAGH, 2.70,False
12
+ 0,c0_seq99,TNTMMHQCTAVALAQR, 2.16,False
13
+ 0,c0_seq100,VHTMMIFQTAEALYKY, 2.58,False
14
+ 0,c0_seq101,FGTGMIFNTAGNMYMT, 3.28,False
15
+ 0,c0_seq102,MVKGMHQQTAENMYDV, 3.41,False
16
+ 0,c0_seq103,RMTGMIQCTAGALAKC, 2.49,False
17
+ 0,c0_seq104,KMRMMHFNTAENMYLD, 3.43,False
18
+ 0,c0_seq105,CRTMMIQNTAENLYFM, 3.06,False
19
+ 0,c0_seq106,KSTGMIQCTAGAMYGT, 2.68,False
20
+ 0,c0_seq107,VFTMMHFNTAEAMYHG, 2.92,False
21
+ 0,c0_seq108,YPRMMIQCTAGNLAEE, 2.99,False
22
+ 0,c0_seq109,LETMMHQQTAGNMYTN, 3.56,False
23
+ 0,c0_seq110,SDKGMIFNTAENMYHS, 3.67,False
24
+ 0,c0_seq111,SSRMMHQNTAVALAHR, 2.93,False
25
+ 0,c0_seq112,QATGMIFNTAEAMYSV, 3.34,False
26
+ 0,c0_seq113,AQTGMHFNTAENMYFC, 2.56,False
27
+ 0,c0_seq114,TDRGMHQCTAVAMALG, 3.47,False
28
+ 0,c0_seq115,WDTGMIFCTAGALYQI, 3.09,False
29
+ 0,c0_seq116,HLKMMIFQTAVNLYDG, 2.86,False
30
+ 0,c0_seq117,NNRGMIFNTAENLAGR, 2.67,False
31
+ 0,c0_seq118,CFRGMHQQTAENMALH, 2.86,False
32
+ 0,c0_seq119,PSKGMHQQTAVNMALD, 2.44,False
33
+ 0,c0_seq120,CGKMMIQNTAVALYSS, 2.85,False
34
+ 0,c0_seq121,WKRGMIQQTAVNLYVR, 3.70,False
35
+ 0,c0_seq122,AWRGMHFNTAEALACL, 3.10,False
36
+ 1,c1_seq639,PDNEWTKKNNWLATWK, 4.43,False
37
+ 1,c1_seq640,NCNEMTSWRNILAASQ, 4.41,False
38
+ 1,c1_seq641,QMNEWTSKNNTLATWE, 4.43,False
39
+ 1,c1_seq642,LRNEWTSKNCILGTYN, 4.42,False
40
+ 1,c1_seq643,ALNEWTSKRNNLGAWW, 4.41,False
41
+ 1,c1_seq644,PANEMTKWRNKLATKC, 4.44,False
42
+ 1,c1_seq645,CNNEWTKWRDLLAADF, 4.44,False
43
+ 1,c1_seq646,QTNEMTKKRCTLVWFE, 4.49,True
44
+ 1,c1_seq647,QTNEMTKKRCTLAWFE, 4.37,True
45
+ 1,c1_seq648,VVNEMTKKNDRLGADL, 4.43,False
46
+ 1,c1_seq649,PPNEMTSKRDYLGAEW, 4.41,False
47
+ 1,c1_seq650,EQNEMTSKNNGLGTHD, 4.43,False
48
+ 1,c1_seq651,WCNEWTSWNCILGANT, 4.43,False
49
+ 1,c1_seq652,TWNEMTKKNDDLAAYQ, 4.43,False
50
+ 1,c1_seq653,QQNEWTSKRDILGWSG, 4.43,False
51
+ 1,c1_seq654,TFNEMTSWRNCLGAWI, 4.45,False
52
+ 1,c1_seq655,CRNEWTSKRNNLGWYH, 4.42,False
53
+ 1,c1_seq656,VLNEMTKWRNVLGTPN, 4.43,False
54
+ 1,c1_seq657,IMNEWTKWNNMLGTEK, 4.43,False
55
+ 1,c1_seq658,DFNEWTKWNCYLGWWK, 4.44,False
56
+ 1,c1_seq659,HKNEMTKWNNMLGAEY, 4.44,False
57
+ 1,c1_seq660,RRNEWTSKRDALGWVT, 4.42,False
58
+ 1,c1_seq661,RENEWTKKRNYLAWQT, 4.42,False
59
+ 1,c1_seq662,RHNEMTKWRCDLGTKS, 4.43,False
60
+ 1,c1_seq663,SLNEMTSKNNALGTDH, 4.43,False
61
+ 1,c1_seq664,DFNEMTSWNNNLGWMY, 4.42,False
62
+ 1,c1_seq665,MGNEWTKWRDQLATKW, 4.42,False
63
+ 1,c1_seq666,ELNEMTKWRNFLATEK, 4.41,False
64
+ 1,c1_seq667,MQNEMTKWNNELAWQP, 4.45,False
65
+ 1,c1_seq668,GRNEWTSKNCFLGTAG, 4.44,False
66
+ 1,c1_seq669,FRNEWTSKRCHLGWEC, 4.40,False
67
+ 2,c2_seq1022,WCEFRRFYICPQPVFH, 1.18,False
68
+ 2,c2_seq1023,WWGFRGRYIDKEPVRS,-1.03,False
69
+ 2,c2_seq1024,GKESDAIGGDRRPVNA, 1.24,False
70
+ 2,c2_seq1025,MGYVYTEMGCLFPVQV, 0.69,False
71
+ 2,c2_seq1026,QKYLDCLWMDYRPVNH, 3.84,True
72
+ 2,c2_seq1027,QKYLDCLWGDYRPVNH,-2.81,True
73
+ 2,c2_seq1028,MFELDLTNIDWYPVMM, 0.60,False
74
+ 2,c2_seq1029,CSEYDASSICKCPVYV, 1.33,False
75
+ 2,c2_seq1030,FHECRYSSGDSSPVAW,-0.33,False
76
+ 2,c2_seq1031,QNEKRDLMGDLYPVCE, 0.63,False
77
+ 2,c2_seq1032,VHEQRTKTGDDTPVAS, 0.41,False
78
+ 2,c2_seq1033,FVEIYDRPGCCNPVAC,-0.92,False
79
+ 2,c2_seq1034,KFEEYCLIICNRPVPD,-0.71,False
80
+ 2,c2_seq1035,YSGARQELIDSEPVDD, 0.35,False
81
+ 2,c2_seq1036,HLEWRLEHGDYWPVIA, 0.87,False
82
+ 2,c2_seq1037,QFEWYAAPGDCGPVVW, 1.08,False
83
+ 2,c2_seq1038,VMYSYPNRIDGCPVEV, 1.53,False
84
+ 2,c2_seq1039,ECYYRQIDICATPVGV,-1.44,False
85
+ 2,c2_seq1040,SLGAYCKNICFSPVYT,-0.81,False
86
+ 2,c2_seq1041,SHECYVCWICMMPVYF,-0.18,False
87
+ 2,c2_seq1042,EHGIYHPWICQDPVHI, 0.57,False
88
+ 2,c2_seq1043,HVYAYSHEICTWPVQM, 0.16,False
89
+ 2,c2_seq1044,VMYRDSFLGDKSPVNF, 1.70,False
90
+ 2,c2_seq1045,ELGIYCPYGDMKPVVV, 0.79,False
91
+ 2,c2_seq1046,RWESRRYKGCDRPVIV, 1.82,False
92
+ 2,c2_seq1047,SSYTDSLSGDNHPVYQ, 0.47,False
93
+ 2,c2_seq1048,LKYARSDCIDGIPVYH, 0.89,False
94
+ 2,c2_seq1049,WDYYDKAHIDIGPVCQ, 0.65,False
95
+ 2,c2_seq1050,NNYPRMCPICNFPVYI,-0.71,False
96
+ 2,c2_seq1051,ADENDNHEGCNWPVNC,-0.06,False
97
+ 2,c2_seq1052,NQYRREPRGCRSPVWK,-0.18,False
98
+ 2,c2_seq1053,GMGWYQHFIDCMPVME, 0.39,False
99
+ 2,c2_seq1054,HHEDYSSHGDRHPVAE, 0.34,False
100
+ 2,c2_seq1055,WFYIRFWNGCMWPVDH, 0.63,False
@@ -0,0 +1,100 @@
1
+ cluster,sequence_id,sequence,activity,is_cliff
2
+ 0,c0_seq89,KSKMMIFNTAENMYIM, 3.51,False
3
+ 0,c0_seq90,NLTMMHQQTAEALAMM, 3.00,False
4
+ 0,c0_seq91,RWTGMIQQTAVAMYPC, 2.84,False
5
+ 0,c0_seq92,, 2.80,False
6
+ 0,c0_seq93,CKKGMIQCTAGNLYAK, 3.30,False
7
+ 0,c0_seq94,DHRMMIFQTAGNLYSQ, 3.68,False
8
+ 0,c0_seq95,DLKMMHQNTPGNMAQD, 4.93,True
9
+ 0,c0_seq96,DLKMMHQNTAGNMAQD, 1.19,True
10
+ 0,c0_seq97,KLKMMHFQTAGNLAQH, 3.26,False
11
+ 0,c0_seq98,WIRMMHFCTAGAMAGH, 2.70,False
12
+ 0,c0_seq99,TNTMMHQCTAVALAQR, 2.16,False
13
+ 0,c0_seq100,VHTMMIFQTAEALYKY, 2.58,False
14
+ 0,c0_seq101,FGTGMIFNTAGNMYMT, 3.28,False
15
+ 0,c0_seq102,MVKGMHQQTAENMYDV, 3.41,False
16
+ 0,c0_seq103,RMTGMIQCTAGALAKC, 2.49,False
17
+ 0,c0_seq104,KMRMMHFNTAENMYLD, 3.43,False
18
+ 0,c0_seq105,CRTMMIQNTAENLYFM, 3.06,False
19
+ 0,c0_seq106,KSTGMIQCTAGAMYGT, 2.68,False
20
+ 0,c0_seq107,VFTMMHFNTAEAMYHG, 2.92,False
21
+ 0,c0_seq108,YPRMMIQCTAGNLAEE, 2.99,False
22
+ 0,c0_seq109,LETMMHQQTAGNMYTN, 3.56,False
23
+ 0,c0_seq110,SDKGMIFNTAENMYHS, 3.67,False
24
+ 0,c0_seq111,SSRMMHQNTAVALAHR, 2.93,False
25
+ 0,c0_seq112,QATGMIFNTAEAMYSV, 3.34,False
26
+ 0,c0_seq113,AQTGMHFNTAENMYFC, 2.56,False
27
+ 0,c0_seq114,, 3.47,False
28
+ 0,c0_seq115,WDTGMIFCTAGALYQI, 3.09,False
29
+ 0,c0_seq116,HLKMMIFQTAVNLYDG, 2.86,False
30
+ 0,c0_seq117,NNRGMIFNTAENLAGR, 2.67,False
31
+ 0,c0_seq118,CFRGMHQQTAENMALH, 2.86,False
32
+ 0,c0_seq119,PSKGMHQQTAVNMALD, 2.44,False
33
+ 0,c0_seq120,CGKMMIQNTAVALYSS, 2.85,False
34
+ 0,c0_seq121,WKRGMIQQTAVNLYVR, 3.70,False
35
+ 0,c0_seq122,AWRGMHFNTAEALACL, 3.10,False
36
+ 1,c1_seq639,PDNEWTKKNNWLATWK, 4.43,False
37
+ 1,c1_seq640,NCNEMTSWRNILAASQ, 4.41,False
38
+ 1,c1_seq641,QMNEWTSKNNTLATWE, 4.43,False
39
+ 1,c1_seq642,LRNEWTSKNCILGTYN, 4.42,False
40
+ 1,c1_seq643,ALNEWTSKRNNLGAWW, 4.41,False
41
+ 1,c1_seq644,PANEMTKWRNKLATKC, 4.44,False
42
+ 1,c1_seq645,CNNEWTKWRDLLAADF, 4.44,False
43
+ 1,c1_seq646,QTNEMTKKRCTLVWFE, 4.49,True
44
+ 1,c1_seq647,QTNEMTKKRCTLAWFE, 4.37,True
45
+ 1,c1_seq648,VVNEMTKKNDRLGADL, 4.43,False
46
+ 1,c1_seq649,PPNEMTSKRDYLGAEW, 4.41,False
47
+ 1,c1_seq650,EQNEMTSKNNGLGTHD, 4.43,False
48
+ 1,c1_seq651,WCNEWTSWNCILGANT, 4.43,False
49
+ 1,c1_seq652,TWNEMTKKNDDLAAYQ, 4.43,False
50
+ 1,c1_seq653,QQNEWTSKRDILGWSG, 4.43,False
51
+ 1,c1_seq654,TFNEMTSWRNCLGAWI, 4.45,False
52
+ 1,c1_seq655,CRNEWTSKRNNLGWYH, 4.42,False
53
+ 1,c1_seq656,VLNEMTKWRNVLGTPN, 4.43,False
54
+ 1,c1_seq657,IMNEWTKWNNMLGTEK, 4.43,False
55
+ 1,c1_seq658,DFNEWTKWNCYLGWWK, 4.44,False
56
+ 1,c1_seq659,HKNEMTKWNNMLGAEY, 4.44,False
57
+ 1,c1_seq660,RRNEWTSKRDALGWVT, 4.42,False
58
+ 1,c1_seq661,RENEWTKKRNYLAWQT, 4.42,False
59
+ 1,c1_seq662,RHNEMTKWRCDLGTKS, 4.43,False
60
+ 1,c1_seq663,SLNEMTSKNNALGTDH, 4.43,False
61
+ 1,c1_seq664,DFNEMTSWNNNLGWMY, 4.42,False
62
+ 1,c1_seq665,MGNEWTKWRDQLATKW, 4.42,False
63
+ 1,c1_seq666,ELNEMTKWRNFLATEK, 4.41,False
64
+ 1,c1_seq667,MQNEMTKWNNELAWQP, 4.45,False
65
+ 1,c1_seq668,GRNEWTSKNCFLGTAG, 4.44,False
66
+ 1,c1_seq669,FRNEWTSKRCHLGWEC, 4.40,False
67
+ 2,c2_seq1022,WCEFRRFYICPQPVFH, 1.18,False
68
+ 2,c2_seq1023,WWGFRGRYIDKEPVRS,-1.03,False
69
+ 2,c2_seq1024,GKESDAIGGDRRPVNA, 1.24,False
70
+ 2,c2_seq1025,MGYVYTEMGCLFPVQV, 0.69,False
71
+ 2,c2_seq1026,QKYLDCLWMDYRPVNH, 3.84,True
72
+ 2,c2_seq1027,QKYLDCLWGDYRPVNH,-2.81,True
73
+ 2,c2_seq1028,MFELDLTNIDWYPVMM, 0.60,False
74
+ 2,c2_seq1029,CSEYDASSICKCPVYV, 1.33,False
75
+ 2,c2_seq1030,FHECRYSSGDSSPVAW,-0.33,False
76
+ 2,c2_seq1031,QNEKRDLMGDLYPVCE, 0.63,False
77
+ 2,c2_seq1032,VHEQRTKTGDDTPVAS, 0.41,False
78
+ 2,c2_seq1033,FVEIYDRPGCCNPVAC,-0.92,False
79
+ 2,c2_seq1034,KFEEYCLIICNRPVPD,-0.71,False
80
+ 2,c2_seq1035,YSGARQELIDSEPVDD, 0.35,False
81
+ 2,c2_seq1036,HLEWRLEHGDYWPVIA, 0.87,False
82
+ 2,c2_seq1037,QFEWYAAPGDCGPVVW, 1.08,False
83
+ 2,c2_seq1038,VMYSYPNRIDGCPVEV, 1.53,False
84
+ 2,c2_seq1039,ECYYRQIDICATPVGV,-1.44,False
85
+ 2,c2_seq1040,SLGAYCKNICFSPVYT,-0.81,False
86
+ 2,c2_seq1041,SHECYVCWICMMPVYF,-0.18,False
87
+ 2,c2_seq1042,EHGIYHPWICQDPVHI, 0.57,False
88
+ 2,c2_seq1043,HVYAYSHEICTWPVQM, 0.16,False
89
+ 2,c2_seq1044,VMYRDSFLGDKSPVNF, 1.70,False
90
+ 2,c2_seq1045,ELGIYCPYGDMKPVVV, 0.79,False
91
+ 2,c2_seq1046,RWESRRYKGCDRPVIV, 1.82,False
92
+ 2,c2_seq1047,SSYTDSLSGDNHPVYQ, 0.47,False
93
+ 2,c2_seq1048,LKYARSDCIDGIPVYH, 0.89,False
94
+ 2,c2_seq1049,WDYYDKAHIDIGPVCQ, 0.65,False
95
+ 2,c2_seq1050,NNYPRMCPICNFPVYI,-0.71,False
96
+ 2,c2_seq1051,ADENDNHEGCNWPVNC,-0.06,False
97
+ 2,c2_seq1052,NQYRREPRGCRSPVWK,-0.18,False
98
+ 2,c2_seq1053,GMGWYQHFIDCMPVME, 0.39,False
99
+ 2,c2_seq1054,HHEDYSSHGDRHPVAE, 0.34,False
100
+ 2,c2_seq1055,WFYIRFWNGCMWPVDH, 0.63,False