geney 1.3.53__py2.py3-none-any.whl → 1.3.55__py2.py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of geney might be problematic. Click here for more details.
- geney/SeqMats.py +4 -3
- geney/oncosplice.py +5 -4
- {geney-1.3.53.dist-info → geney-1.3.55.dist-info}/METADATA +1 -1
- {geney-1.3.53.dist-info → geney-1.3.55.dist-info}/RECORD +6 -6
- {geney-1.3.53.dist-info → geney-1.3.55.dist-info}/WHEEL +0 -0
- {geney-1.3.53.dist-info → geney-1.3.55.dist-info}/top_level.txt +0 -0
geney/SeqMats.py
CHANGED
|
@@ -363,13 +363,14 @@ class SeqMat:
|
|
|
363
363
|
raw_seq = temp.seq # Extract the raw sequence
|
|
364
364
|
pattern = re.compile(r"(?:[NACGT]{3})*?(TAA|TAG|TGA)")
|
|
365
365
|
# match = pattern.match(raw_seq)
|
|
366
|
-
match = [(m.group(), m.start()) for m in re.finditer(r"(?:[NACGT]{3})*?(TAA|TAG|TGA)", raw_seq) if
|
|
367
|
-
(m.start()
|
|
366
|
+
match = [(m.group(), m.start()+1) for m in re.finditer(r"(?:[NACGT]{3})*?(TAA|TAG|TGA)", raw_seq) if
|
|
367
|
+
(m.start()+1) % 3 == 0]
|
|
368
368
|
|
|
369
369
|
if len(match) > 0:
|
|
370
370
|
stop_index = match[0][-1] #.end()
|
|
371
371
|
else:
|
|
372
|
-
stop_index = len(raw_seq)
|
|
372
|
+
stop_index = len(raw_seq) - (len(raw_seq) % 3)
|
|
373
|
+
|
|
373
374
|
end_index = stop_index
|
|
374
375
|
# assert (end_index+1) % 3 == 0, f"{end_index} is not a multiple of 3"
|
|
375
376
|
return SeqMat(temp.seqmat[:, :end_index])
|
geney/oncosplice.py
CHANGED
|
@@ -319,14 +319,15 @@ def oncosplice(mut_id, splicing_threshold=0.5, protein_coding=True, cons_require
|
|
|
319
319
|
|
|
320
320
|
results = []
|
|
321
321
|
for reference_transcript in tqdm(gene, desc=f'Processing {mut_id}...'):
|
|
322
|
-
if (cons_required and not reference_transcript.cons_available) or (
|
|
323
|
-
|
|
324
|
-
|
|
322
|
+
# if (cons_required and not reference_transcript.cons_available) or (
|
|
323
|
+
# protein_coding and not reference_transcript.transcript_biotype == 'protein_coding'):
|
|
324
|
+
if protein_coding and not reference_transcript.transcript_biotype == 'protein_coding':
|
|
325
|
+
print("Not protein coding...")
|
|
325
326
|
continue
|
|
326
327
|
|
|
327
328
|
current_mutations = [m for m in mutations if m in reference_transcript]
|
|
328
329
|
if len(current_mutations) == 0:
|
|
329
|
-
print("No mutations within transcript...")
|
|
330
|
+
print(f"No mutations within transcript ({reference_transcript.transcript_start} > {reference_transcript.transcript_end})...")
|
|
330
331
|
continue
|
|
331
332
|
|
|
332
333
|
center = np.mean([m.indices[0] for m in current_mutations]) // 1
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
geney/Fasta_segment.py,sha256=99HxNGNh_MfdVW6hhtlb1vOn7eSmT7oFoEfHDFMxG8w,11275
|
|
2
2
|
geney/Gene.py,sha256=nMWJjoQaiVFm2iRjoiq7ghZqnXtW0tJDcq2S0AyOIvY,6883
|
|
3
|
-
geney/SeqMats.py,sha256=
|
|
3
|
+
geney/SeqMats.py,sha256=AKR1EhyDhOaEhavrkXSrVjYsohB6Qvsq11Udy7SGwvs,19238
|
|
4
4
|
geney/Transcript.py,sha256=CpfxYkuCwFILozrtLuiWnlr1mRnMKn4o84HVJislgYs,14499
|
|
5
5
|
geney/__init__.py,sha256=eBdDl42N6UhcYeZDjOnv199Z88fI5_8Y6xW8447OKXM,755
|
|
6
6
|
geney/_mutation_utils.py,sha256=dHssUsnii_mf-wuRoMmF13UlD7k3ml_VwQMItTYnXpU,1132
|
|
@@ -11,7 +11,7 @@ geney/graphic_utils.py,sha256=oMsBpB9YeEn96gGpKh4MmtagJffWZbk-xPrIwHvkFhA,11016
|
|
|
11
11
|
geney/gtex_utils.py,sha256=asL2lHyU5KsbWpV096vkf1Ka7hSo_RRfZqw7p5nERmE,1919
|
|
12
12
|
geney/immune_utils.py,sha256=ZRni5ttrhpYBnmNr0d0ZatIbNPYs4nmQuoUO00SpsS4,5271
|
|
13
13
|
geney/mutation_utils.py,sha256=C_kv2MB_L8LlhX3W2ooXjJ3uDoJ8zX1WeDtZKoBZJkI,1547
|
|
14
|
-
geney/oncosplice.py,sha256
|
|
14
|
+
geney/oncosplice.py,sha256=-WlZRRkrZGF9hNT9CEJJUBxeeR0lKy2Yo9kzjPYC8Ok,24579
|
|
15
15
|
geney/pangolin_utils.py,sha256=9jdBXlOcRaUdfi-UpUxHA0AkTMZkUF-Lt7HVZ1nEm3s,2973
|
|
16
16
|
geney/power_utils.py,sha256=MehZFUdkJ2EFUot709yPEDxSkXmH5XevMebX2HD768A,7330
|
|
17
17
|
geney/seqmat_utils.py,sha256=wzb3PX5it5bpIFQvcxyzlxfhoJTbHHbsjg0rzh05iVs,19753
|
|
@@ -25,7 +25,7 @@ geney/translation_initiation/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NM
|
|
|
25
25
|
geney/translation_initiation/tis_utils.py,sha256=AF3siFjuQH-Rs44EV-80zHdbxRMvN4woLFSHroWIETc,4448
|
|
26
26
|
geney/translation_initiation/resources/kozak_pssm.json,sha256=pcd0Olziutq-6H3mFWDCD9cujQ_AlZO-iiOvBl82hqE,1165
|
|
27
27
|
geney/translation_initiation/resources/tis_regressor_model.joblib,sha256=IXb4DUDhJ5rBDKcqMk9zE3ECTZZcdj7Jixz3KpoZ7OA,2592025
|
|
28
|
-
geney-1.3.
|
|
29
|
-
geney-1.3.
|
|
30
|
-
geney-1.3.
|
|
31
|
-
geney-1.3.
|
|
28
|
+
geney-1.3.55.dist-info/METADATA,sha256=kLdJrug4ERJSEvhw28dSYyHv7Ax4PYtWtcRfvlFVpsY,990
|
|
29
|
+
geney-1.3.55.dist-info/WHEEL,sha256=AHX6tWk3qWuce7vKLrj7lnulVHEdWoltgauo8bgCXgU,109
|
|
30
|
+
geney-1.3.55.dist-info/top_level.txt,sha256=O-FuNUMb5fn9dhZ-dYCgF0aZtfi1EslMstnzhc5IIVo,6
|
|
31
|
+
geney-1.3.55.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|