python-katlas 0.1.3__tar.gz → 2025.10.20__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {python_katlas-0.1.3 → python_katlas-2025.10.20}/LICENSE +0 -0
- {python_katlas-0.1.3 → python_katlas-2025.10.20}/MANIFEST.in +0 -0
- {python_katlas-0.1.3/python_katlas.egg-info → python_katlas-2025.10.20}/PKG-INFO +148 -110
- {python_katlas-0.1.3 → python_katlas-2025.10.20}/README.md +118 -100
- python_katlas-2025.10.20/katlas/__init__.py +1 -0
- python_katlas-2025.10.20/katlas/_modidx.py +213 -0
- python_katlas-2025.10.20/katlas/clustering.py +142 -0
- python_katlas-2025.10.20/katlas/common.py +3 -0
- python_katlas-2025.10.20/katlas/core.py +6 -0
- python_katlas-2025.10.20/katlas/data.py +446 -0
- python_katlas-2025.10.20/katlas/dnn.py +384 -0
- {python_katlas-0.1.3 → python_katlas-2025.10.20}/katlas/feature.py +136 -111
- python_katlas-2025.10.20/katlas/pathway.py +156 -0
- python_katlas-2025.10.20/katlas/plot.py +879 -0
- python_katlas-2025.10.20/katlas/pssm.py +784 -0
- python_katlas-2025.10.20/katlas/score.py +364 -0
- python_katlas-2025.10.20/katlas/statistics.py +102 -0
- {python_katlas-0.1.3 → python_katlas-2025.10.20}/katlas/train.py +51 -77
- python_katlas-2025.10.20/katlas/utils.py +176 -0
- python_katlas-2025.10.20/pyproject.toml +11 -0
- {python_katlas-0.1.3 → python_katlas-2025.10.20/python_katlas.egg-info}/PKG-INFO +148 -110
- {python_katlas-0.1.3 → python_katlas-2025.10.20}/python_katlas.egg-info/SOURCES.txt +10 -2
- {python_katlas-0.1.3 → python_katlas-2025.10.20}/python_katlas.egg-info/requires.txt +15 -8
- {python_katlas-0.1.3 → python_katlas-2025.10.20}/settings.ini +4 -4
- {python_katlas-0.1.3 → python_katlas-2025.10.20}/setup.py +0 -0
- python_katlas-0.1.3/katlas/__init__.py +0 -1
- python_katlas-0.1.3/katlas/_modidx.py +0 -109
- python_katlas-0.1.3/katlas/core.py +0 -816
- python_katlas-0.1.3/katlas/dl.py +0 -357
- python_katlas-0.1.3/katlas/imports.py +0 -7
- python_katlas-0.1.3/katlas/plot.py +0 -665
- {python_katlas-0.1.3 → python_katlas-2025.10.20}/python_katlas.egg-info/dependency_links.txt +0 -0
- {python_katlas-0.1.3 → python_katlas-2025.10.20}/python_katlas.egg-info/entry_points.txt +0 -0
- {python_katlas-0.1.3 → python_katlas-2025.10.20}/python_katlas.egg-info/not-zip-safe +0 -0
- {python_katlas-0.1.3 → python_katlas-2025.10.20}/python_katlas.egg-info/top_level.txt +0 -0
- {python_katlas-0.1.3 → python_katlas-2025.10.20}/setup.cfg +0 -0
|
File without changes
|
|
File without changes
|
|
@@ -1,6 +1,6 @@
|
|
|
1
|
-
Metadata-Version: 2.
|
|
1
|
+
Metadata-Version: 2.4
|
|
2
2
|
Name: python-katlas
|
|
3
|
-
Version:
|
|
3
|
+
Version: 2025.10.20
|
|
4
4
|
Summary: tools for predicting kinome specificities
|
|
5
5
|
Home-page: https://github.com/sky1ove/katlas
|
|
6
6
|
Author: lily
|
|
@@ -18,36 +18,51 @@ Classifier: License :: OSI Approved :: Apache Software License
|
|
|
18
18
|
Requires-Python: >=3.7
|
|
19
19
|
Description-Content-Type: text/markdown
|
|
20
20
|
License-File: LICENSE
|
|
21
|
+
Requires-Dist: pandas
|
|
22
|
+
Requires-Dist: gdown
|
|
21
23
|
Requires-Dist: statsmodels
|
|
22
24
|
Requires-Dist: fastparquet
|
|
25
|
+
Requires-Dist: pyarrow
|
|
23
26
|
Requires-Dist: tqdm
|
|
27
|
+
Requires-Dist: logomaker-kinase
|
|
28
|
+
Requires-Dist: seaborn
|
|
29
|
+
Requires-Dist: bokeh
|
|
30
|
+
Requires-Dist: reactome2py
|
|
31
|
+
Requires-Dist: adjustText
|
|
32
|
+
Requires-Dist: scikit-learn
|
|
33
|
+
Requires-Dist: umap-learn
|
|
34
|
+
Requires-Dist: ipywidgets
|
|
35
|
+
Requires-Dist: biopython
|
|
24
36
|
Provides-Extra: dev
|
|
25
37
|
Requires-Dist: nbdev; extra == "dev"
|
|
26
38
|
Requires-Dist: pyngrok; extra == "dev"
|
|
27
|
-
Requires-Dist: fastai
|
|
28
|
-
Requires-Dist: fastbook; extra == "dev"
|
|
39
|
+
Requires-Dist: fastai; extra == "dev"
|
|
29
40
|
Requires-Dist: fairscale; extra == "dev"
|
|
30
41
|
Requires-Dist: fair-esm; extra == "dev"
|
|
31
|
-
Requires-Dist: logomaker; extra == "dev"
|
|
32
|
-
Requires-Dist: seaborn; extra == "dev"
|
|
33
42
|
Requires-Dist: rdkit; extra == "dev"
|
|
34
|
-
Requires-Dist: umap-learn; extra == "dev"
|
|
35
|
-
Requires-Dist: adjustText; extra == "dev"
|
|
36
|
-
Requires-Dist: bokeh; extra == "dev"
|
|
37
|
-
Requires-Dist: scikit-learn>=1.3.0; extra == "dev"
|
|
38
43
|
Requires-Dist: openpyxl; extra == "dev"
|
|
44
|
+
Requires-Dist: transformers; extra == "dev"
|
|
45
|
+
Requires-Dist: sentencepiece; extra == "dev"
|
|
46
|
+
Dynamic: author
|
|
47
|
+
Dynamic: author-email
|
|
48
|
+
Dynamic: classifier
|
|
49
|
+
Dynamic: description
|
|
50
|
+
Dynamic: description-content-type
|
|
51
|
+
Dynamic: home-page
|
|
52
|
+
Dynamic: keywords
|
|
53
|
+
Dynamic: license
|
|
54
|
+
Dynamic: license-file
|
|
55
|
+
Dynamic: provides-extra
|
|
56
|
+
Dynamic: requires-dist
|
|
57
|
+
Dynamic: requires-python
|
|
58
|
+
Dynamic: summary
|
|
39
59
|
|
|
40
60
|
# KATLAS
|
|
41
61
|
|
|
42
62
|
|
|
43
63
|
<!-- WARNING: THIS FILE WAS AUTOGENERATED! DO NOT EDIT! -->
|
|
44
64
|
|
|
45
|
-
<img alt="Katlas logo" width="600" caption="Katlas logo" src="https://github.com/sky1ove/katlas/raw/main/
|
|
46
|
-
|
|
47
|
-
<a target="_blank" href="https://colab.research.google.com/github/sky1ove/katlas/blob/main/nbs/index.ipynb">
|
|
48
|
-
<img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/>
|
|
49
|
-
</a> <a href="https://pypi.org/project/python-katlas/">
|
|
50
|
-
<img src="https://img.shields.io/pypi/v/python-katlas?link=https%3A%2F%2Fpypi.org%2Fproject%2Fpython-katlas%2F" alt="PyPI"></a>
|
|
65
|
+
<img alt="Katlas logo" width="600" caption="Katlas logo" src="https://github.com/sky1ove/katlas/raw/main/logo.png" id="logo"/>
|
|
51
66
|
|
|
52
67
|
KATLAS is a repository containing python tools to predict kinases given
|
|
53
68
|
a substrate sequence. It also contains datasets of kinase substrate
|
|
@@ -93,26 +108,24 @@ code.
|
|
|
93
108
|
Check out our latest web platform:
|
|
94
109
|
[kinase-atlas.com](https://kinase-atlas.com/)
|
|
95
110
|
|
|
96
|
-
##
|
|
111
|
+
## Install
|
|
97
112
|
|
|
98
|
-
|
|
99
|
-
sequence](https://colab.research.google.com/github/sky1ove/katlas/blob/main/nbs/tutorial_01_sinlge_input.ipynb)
|
|
100
|
-
- 2. [High throughput substrate scoring on phosphoproteomics
|
|
101
|
-
dataset](https://colab.research.google.com/github/sky1ove/katlas/blob/main/nbs/tutorial_02_high_throughput.ipynb)
|
|
102
|
-
- 3. [Kinase enrichment analysis for AKT
|
|
103
|
-
inhibitor](https://colab.research.google.com/github/sky1ove/katlas/blob/main/nbs/tutorial_03a_enrichment_AKTi.ipynb)
|
|
113
|
+
UV:
|
|
104
114
|
|
|
105
|
-
|
|
115
|
+
``` bash
|
|
116
|
+
uv add -U git+https://github.com/sky1ove/katlas.git
|
|
117
|
+
```
|
|
106
118
|
|
|
107
|
-
|
|
119
|
+
pip:
|
|
108
120
|
|
|
109
|
-
|
|
110
|
-
|
|
121
|
+
``` bash
|
|
122
|
+
pip install -U git+https://github.com/sky1ove/katlas.git
|
|
123
|
+
```
|
|
111
124
|
|
|
112
125
|
## Import
|
|
113
126
|
|
|
114
127
|
``` python
|
|
115
|
-
from katlas.
|
|
128
|
+
from katlas.common import *
|
|
116
129
|
```
|
|
117
130
|
|
|
118
131
|
# Quick start
|
|
@@ -132,93 +145,101 @@ For input sequences, we also consider it in two conditions:
|
|
|
132
145
|
- all capital
|
|
133
146
|
- contains lower cases indicating phosphorylation status
|
|
134
147
|
|
|
135
|
-
##
|
|
148
|
+
## Quick start
|
|
136
149
|
|
|
137
|
-
###
|
|
150
|
+
### Site scoring
|
|
151
|
+
|
|
152
|
+
CDDM, all capital
|
|
138
153
|
|
|
139
154
|
``` python
|
|
140
|
-
predict_kinase('
|
|
155
|
+
predict_kinase('AAAAAAASGAGSDN',**Params("CDDM_upper"))
|
|
141
156
|
```
|
|
142
157
|
|
|
143
|
-
considering string: ['-7A', '-6A', '-5A', '-4A', '-3A', '-2A', '-1A', '0S', '1G', '
|
|
158
|
+
considering string: ['-7A', '-6A', '-5A', '-4A', '-3A', '-2A', '-1A', '0S', '1G', '2A', '3G', '4S', '5D', '6N']
|
|
144
159
|
|
|
145
|
-
|
|
146
|
-
|
|
147
|
-
|
|
148
|
-
|
|
149
|
-
|
|
150
|
-
|
|
151
|
-
|
|
152
|
-
|
|
153
|
-
|
|
154
|
-
|
|
155
|
-
|
|
156
|
-
|
|
157
|
-
Length: 289, dtype: float64
|
|
160
|
+
GCN2 4.556
|
|
161
|
+
MPSK1 4.425
|
|
162
|
+
MEKK2 4.253
|
|
163
|
+
WNK3 4.213
|
|
164
|
+
WNK1 4.064
|
|
165
|
+
...
|
|
166
|
+
PDK1 -25.077
|
|
167
|
+
PDHK3 -25.346
|
|
168
|
+
CLK2 -27.251
|
|
169
|
+
ROR2 -27.582
|
|
170
|
+
DDR1 -53.581
|
|
171
|
+
Length: 328, dtype: float64
|
|
158
172
|
|
|
159
|
-
|
|
173
|
+
CDDM, with lower case indicating phosphorylation status
|
|
160
174
|
|
|
161
175
|
``` python
|
|
162
|
-
predict_kinase('AAAAAAAsGGAGsDN',**
|
|
176
|
+
predict_kinase('AAAAAAAsGGAGsDN',**Params("CDDM"))
|
|
163
177
|
```
|
|
164
178
|
|
|
165
179
|
considering string: ['-7A', '-6A', '-5A', '-4A', '-3A', '-2A', '-1A', '0s', '1G', '2G', '3A', '4G', '5s', '6D', '7N']
|
|
166
180
|
|
|
167
|
-
|
|
168
|
-
|
|
169
|
-
|
|
170
|
-
|
|
171
|
-
|
|
172
|
-
|
|
173
|
-
|
|
174
|
-
|
|
175
|
-
|
|
176
|
-
|
|
177
|
-
|
|
178
|
-
|
|
179
|
-
|
|
180
|
-
|
|
181
|
-
### PSPA, with lower case indicating phosphorylation status
|
|
181
|
+
ROR1 8.355
|
|
182
|
+
WNK1 4.907
|
|
183
|
+
WNK2 4.782
|
|
184
|
+
ERK5 4.466
|
|
185
|
+
RIPK2 4.045
|
|
186
|
+
...
|
|
187
|
+
DDR1 -29.393
|
|
188
|
+
TNNI3K -29.884
|
|
189
|
+
CHAK1 -31.775
|
|
190
|
+
VRK1 -45.287
|
|
191
|
+
BRAF -49.403
|
|
192
|
+
Length: 328, dtype: float64
|
|
193
|
+
|
|
194
|
+
PSPA, with lower case indicating phosphorylation status
|
|
182
195
|
|
|
183
196
|
``` python
|
|
184
|
-
predict_kinase('AEEKEyHsEGG',**
|
|
197
|
+
predict_kinase('AEEKEyHsEGG',**Params("PSPA"))
|
|
185
198
|
```
|
|
186
199
|
|
|
187
200
|
considering string: ['-5A', '-4E', '-3E', '-2K', '-1E', '0y', '1H', '2s', '3E', '4G', '5G']
|
|
188
201
|
|
|
189
202
|
kinase
|
|
190
|
-
EGFR
|
|
191
|
-
FGFR4
|
|
192
|
-
ZAP70
|
|
193
|
-
CSK
|
|
194
|
-
SYK
|
|
195
|
-
|
|
196
|
-
|
|
197
|
-
|
|
203
|
+
EGFR 4.013
|
|
204
|
+
FGFR4 3.568
|
|
205
|
+
ZAP70 3.412
|
|
206
|
+
CSK 3.241
|
|
207
|
+
SYK 3.209
|
|
208
|
+
...
|
|
209
|
+
JAK1 -3.837
|
|
210
|
+
DDR2 -4.421
|
|
211
|
+
TNK2 -4.534
|
|
212
|
+
TNNI3K_TYR -4.651
|
|
213
|
+
TNK1 -5.320
|
|
214
|
+
Length: 93, dtype: float64
|
|
215
|
+
|
|
216
|
+
To replicate the results from The Kinase Library (PSPA)
|
|
198
217
|
|
|
199
218
|
Check this link: [The Kinase
|
|
200
|
-
Library](https://kinase-library.
|
|
219
|
+
Library](https://kinase-library.mit.edu/site?s=AEEKEy*HSEGG&pp=false&scp=true),
|
|
201
220
|
and use log2(score) to rank, it shows same results with the below (with
|
|
202
221
|
slight differences due to rounding).
|
|
203
222
|
|
|
204
223
|
``` python
|
|
205
|
-
predict_kinase('AEEKEyHSEGG',**
|
|
224
|
+
out = predict_kinase('AEEKEyHSEGG',**Params("PSPA"))
|
|
225
|
+
out
|
|
206
226
|
```
|
|
207
227
|
|
|
208
228
|
considering string: ['-5A', '-4E', '-3E', '-2K', '-1E', '0y', '1H', '2S', '3E', '4G', '5G']
|
|
209
229
|
|
|
210
230
|
kinase
|
|
211
|
-
EGFR
|
|
212
|
-
FGFR4
|
|
213
|
-
CSK
|
|
214
|
-
ZAP70
|
|
215
|
-
SYK
|
|
216
|
-
|
|
217
|
-
|
|
218
|
-
|
|
219
|
-
|
|
220
|
-
|
|
221
|
-
|
|
231
|
+
EGFR 3.181
|
|
232
|
+
FGFR4 2.390
|
|
233
|
+
CSK 2.308
|
|
234
|
+
ZAP70 2.068
|
|
235
|
+
SYK 1.998
|
|
236
|
+
...
|
|
237
|
+
EPHA1 -3.501
|
|
238
|
+
FES -3.699
|
|
239
|
+
TNK1 -4.269
|
|
240
|
+
TNK2 -4.577
|
|
241
|
+
DDR2 -4.920
|
|
242
|
+
Length: 93, dtype: float64
|
|
222
243
|
|
|
223
244
|
- So far [The kinase Library](https://kinase-library.phosphosite.org)
|
|
224
245
|
considers all ***tyr sequences*** in capital regardless of whether or
|
|
@@ -234,8 +255,10 @@ sheet.
|
|
|
234
255
|
``` python
|
|
235
256
|
# Percentile reference sheet
|
|
236
257
|
y_pct = Data.get_pspa_tyr_pct()
|
|
258
|
+
```
|
|
237
259
|
|
|
238
|
-
|
|
260
|
+
``` python
|
|
261
|
+
get_pct('AEEKEyHSEGG',pct_ref = y_pct,**Params("PSPA_y"))
|
|
239
262
|
```
|
|
240
263
|
|
|
241
264
|
considering string: ['-5A', '-4E', '-3E', '-2K', '-1E', '0Y', '1H', '2S', '3E', '4G', '5G']
|
|
@@ -270,15 +293,15 @@ get_pct('AEEKEyHSEGG',**param_PSPA_y, pct_ref = y_pct)
|
|
|
270
293
|
<p>93 rows × 2 columns</p>
|
|
271
294
|
</div>
|
|
272
295
|
|
|
273
|
-
|
|
296
|
+
### Site scoring in a df
|
|
274
297
|
|
|
275
|
-
|
|
298
|
+
Load your csv:
|
|
276
299
|
|
|
277
300
|
``` python
|
|
278
301
|
# df = pd.read_csv('your_file.csv')
|
|
279
302
|
```
|
|
280
303
|
|
|
281
|
-
|
|
304
|
+
Or load a demo df
|
|
282
305
|
|
|
283
306
|
``` python
|
|
284
307
|
# Load a demo df with phosphorylation sites
|
|
@@ -309,22 +332,21 @@ df.iloc[:,-2:]
|
|
|
309
332
|
|
|
310
333
|
</div>
|
|
311
334
|
|
|
312
|
-
|
|
335
|
+
Set the column name and param to calculate
|
|
313
336
|
|
|
314
337
|
Here we choose param_CDDM_upper, as the sequences in the demo df are all
|
|
315
338
|
in capital. You can also choose other params.
|
|
316
339
|
|
|
317
340
|
``` python
|
|
318
|
-
results = predict_kinase_df(df,'site_seq',**
|
|
341
|
+
results = predict_kinase_df(df,'site_seq',**Params("CDDM_upper"))
|
|
319
342
|
results
|
|
320
343
|
```
|
|
321
344
|
|
|
322
345
|
input dataframe has a length 5
|
|
323
346
|
Preprocessing
|
|
324
347
|
Finish preprocessing
|
|
325
|
-
|
|
326
|
-
|
|
327
|
-
100%|██████████| 289/289 [00:05<00:00, 56.64it/s]
|
|
348
|
+
Merging reference
|
|
349
|
+
Finish merging
|
|
328
350
|
|
|
329
351
|
<div>
|
|
330
352
|
<style scoped>
|
|
@@ -339,18 +361,35 @@ results
|
|
|
339
361
|
}
|
|
340
362
|
</style>
|
|
341
363
|
|
|
342
|
-
|
|
|
364
|
+
| | SRC | EPHA3 | FES | NTRK3 | ALK | ABL1 | FLT3 | EPHA8 | EPHB2 | EPHB1 | ... | VRK1 | PKMYT1 | GRK3 | CAMK1B | CDC7 | SMMLCK | ROR1 | GAK | MAST2 | BRAF |
|
|
343
365
|
|----|----|----|----|----|----|----|----|----|----|----|----|----|----|----|----|----|----|----|----|----|----|
|
|
344
|
-
| 0 |
|
|
345
|
-
| 1 |
|
|
346
|
-
| 2 |
|
|
347
|
-
| 3 |
|
|
348
|
-
| 4 |
|
|
366
|
+
| 0 | -2.440640 | -0.818753 | -1.663990 | -0.738991 | -2.047628 | -3.602344 | -3.200998 | -0.935176 | -1.388444 | -1.859450 | ... | -17.103237 | -113.698143 | -16.848783 | -41.520172 | -41.646187 | 1.284159 | -26.566362 | -69.165062 | -17.706400 | -87.763214 |
|
|
367
|
+
| 1 | -3.838486 | -2.735969 | -2.533986 | -2.150399 | -3.792498 | -4.725527 | -5.711791 | -4.534240 | -3.148449 | -2.511518 | ... | -67.889053 | -68.652641 | -45.833855 | -64.171600 | -39.465572 | -65.061722 | -109.561707 | -85.911224 | -60.105064 | -63.889122 |
|
|
368
|
+
| 2 | -2.610423 | -2.370090 | -3.235637 | -1.508413 | -2.571347 | -3.740941 | -3.025596 | -3.373504 | -2.776297 | -3.060740 | ... | -15.798462 | -45.905319 | -61.440742 | -67.695694 | -55.047962 | -42.135216 | -38.501572 | -62.624382 | -56.119389 | -107.060989 |
|
|
369
|
+
| 3 | -5.180541 | -4.201880 | -5.766463 | -3.038421 | -3.836897 | -4.249900 | -5.029885 | -5.411311 | -4.713308 | -4.827825 | ... | -96.978317 | -83.419777 | -22.559393 | -110.611588 | -63.283070 | -37.240440 | -24.497492 | -112.878151 | -43.538158 | -60.348518 |
|
|
370
|
+
| 4 | -2.844254 | -3.322700 | -3.681745 | -1.766435 | -2.666579 | -3.748774 | -4.083619 | -3.912834 | -3.724181 | -3.948160 | ... | -35.824612 | -87.983566 | -83.312317 | -107.162407 | -61.478374 | -85.793571 | -43.738819 | -47.004211 | -42.281624 | -59.518513 |
|
|
349
371
|
|
|
350
|
-
<p>5 rows ×
|
|
372
|
+
<p>5 rows × 328 columns</p>
|
|
351
373
|
</div>
|
|
352
374
|
|
|
353
|
-
|
|
375
|
+
``` python
|
|
376
|
+
results.iloc[0].sort_values(ascending=False)
|
|
377
|
+
```
|
|
378
|
+
|
|
379
|
+
TLK2 8.264621
|
|
380
|
+
GCN2 8.101542
|
|
381
|
+
TLK1 7.693897
|
|
382
|
+
HRI 6.691402
|
|
383
|
+
PLK3 6.579368
|
|
384
|
+
...
|
|
385
|
+
NIK -64.605148
|
|
386
|
+
SRPK2 -67.300667
|
|
387
|
+
GAK -69.165062
|
|
388
|
+
BRAF -87.763214
|
|
389
|
+
PKMYT1 -113.698143
|
|
390
|
+
Name: 0, Length: 328, dtype: float32
|
|
391
|
+
|
|
392
|
+
## Dataset
|
|
354
393
|
|
|
355
394
|
Besides calculating sequence scores, we also provides multiple datasets
|
|
356
395
|
of phosphorylation sites.
|
|
@@ -405,9 +444,9 @@ df.head(3)
|
|
|
405
444
|
|
|
406
445
|
| | uniprot | position | residue | is_disopred | disopred_score | log10_hotspot_pval_min | isHotspot | uniprot_position | functional_score | current_uniprot | name | gene | Sequence | is_valid | site_seq | gene_site |
|
|
407
446
|
|----|----|----|----|----|----|----|----|----|----|----|----|----|----|----|----|----|
|
|
408
|
-
| 0 | A0A075B6Q4 | 24 | S |
|
|
409
|
-
| 1 | A0A075B6Q4 | 35 | S |
|
|
410
|
-
| 2 | A0A075B6Q4 | 57 | S |
|
|
447
|
+
| 0 | A0A075B6Q4 | 24 | S | 1.0 | 0.91 | 6.839384 | 1.0 | A0A075B6Q4_24 | 0.149257 | A0A075B6Q4 | A0A075B6Q4_HUMAN | None | MDIQKSENEDDSEWEDVDDEKGDSNDDYDSAGLLSDEDCMSVPGKT... | True | VDDEKGDSNDDYDSA | A0A075B6Q4_S24 |
|
|
448
|
+
| 1 | A0A075B6Q4 | 35 | S | 1.0 | 0.87 | 9.192622 | 0.0 | A0A075B6Q4_35 | 0.136966 | A0A075B6Q4 | A0A075B6Q4_HUMAN | None | MDIQKSENEDDSEWEDVDDEKGDSNDDYDSAGLLSDEDCMSVPGKT... | True | YDSAGLLSDEDCMSV | A0A075B6Q4_S35 |
|
|
449
|
+
| 2 | A0A075B6Q4 | 57 | S | 0.0 | 0.28 | 0.818834 | 0.0 | A0A075B6Q4_57 | 0.125364 | A0A075B6Q4 | A0A075B6Q4_HUMAN | None | MDIQKSENEDDSEWEDVDDEKGDSNDDYDSAGLLSDEDCMSVPGKT... | True | IADHLFWSEETKSRF | A0A075B6Q4_S57 |
|
|
411
450
|
|
|
412
451
|
</div>
|
|
413
452
|
|
|
@@ -459,13 +498,12 @@ df.head(3)
|
|
|
459
498
|
}
|
|
460
499
|
</style>
|
|
461
500
|
|
|
462
|
-
| |
|
|
463
|
-
|
|
464
|
-
| 0 |
|
|
465
|
-
| 1 |
|
|
466
|
-
| 2 |
|
|
501
|
+
| | uniprot | gene | site | site_seq | source | AM_pathogenicity | CDDM_upper | CDDM_max_score |
|
|
502
|
+
|----|----|----|----|----|----|----|----|----|
|
|
503
|
+
| 0 | A0A024R4G9 | C19orf48 | S20 | ITGSRLLSMVPGPAR | psp | NaN | PRKX,AKT1,PKG1,P90RSK,HIPK4,AKT3,HIPK1,PKACB,H... | 2.407041 |
|
|
504
|
+
| 1 | A0A075B6Q4 | None | S24 | VDDEKGDSNDDYDSA | ochoa | NaN | CK2A2,CK2A1,GRK7,GRK5,CK1G1,CK1A,IKKA,CK1G2,CA... | 2.295654 |
|
|
505
|
+
| 2 | A0A075B6Q4 | None | S35 | YDSAGLLSDEDCMSV | ochoa | NaN | CK2A2,CK2A1,IKKA,ATM,IKKB,CAMK1D,MARK2,GRK7,IK... | 2.488683 |
|
|
467
506
|
|
|
468
|
-
<p>3 rows × 21 columns</p>
|
|
469
507
|
</div>
|
|
470
508
|
|
|
471
509
|
## Phosphorylation site sequence example
|