ORForise 1.6.1__tar.gz → 1.6.2__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {orforise-1.6.1 → orforise-1.6.2}/PKG-INFO +6 -6
- {orforise-1.6.1 → orforise-1.6.2}/README.md +5 -5
- {orforise-1.6.1 → orforise-1.6.2}/pyproject.toml +1 -1
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Aggregate_Compare.py +3 -5
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Annotation_Compare.py +4 -3
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Annotation_Intersector.py +2 -2
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Comparator.py +3 -2
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Convert_To_GFF.py +5 -3
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/GFF_Adder.py +3 -3
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/List_Tools.py +3 -10
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/StORForise.py +3 -3
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/Augustus/Augustus.py +13 -1
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/Balrog/Balrog.py +13 -1
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/FGENESB/FGENESB.py +13 -1
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/FragGeneScan/FragGeneScan.py +13 -1
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/GFF/GFF.py +13 -2
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/GLIMMER3/GLIMMER3.py +13 -1
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/GeneMark/GeneMark.py +13 -1
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/GeneMarkHA/GeneMarkHA.py +21 -9
- orforise-1.6.1/src/ORForise/Tools/GeneMark_HMM/GeneMark_HMM.py → orforise-1.6.2/src/ORForise/Tools/GeneMarkHMM/GeneMarkHMM.py +22 -10
- orforise-1.6.1/src/ORForise/Tools/GeneMark_S/GeneMark_S.py → orforise-1.6.2/src/ORForise/Tools/GeneMarkS/GeneMarkS.py +22 -10
- orforise-1.6.1/src/ORForise/Tools/GeneMark_S_2/GeneMark_S_2.py → orforise-1.6.2/src/ORForise/Tools/GeneMarkS2/GeneMarkS2.py +23 -11
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/MetaGene/MetaGene.py +13 -1
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/MetaGeneAnnotator/MetaGeneAnnotator.py +13 -1
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/MetaGeneMark/MetaGeneMark.py +13 -1
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/Prodigal/Prodigal.py +3 -3
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/Prokka/Prokka.py +14 -2
- orforise-1.6.1/src/ORForise/Tools/StORF_Reporter/StORF_Reporter.py → orforise-1.6.2/src/ORForise/Tools/StORF-Reporter/StORF-Reporter.py +14 -2
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/TransDecoder/TransDecoder.py +13 -1
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise.egg-info/PKG-INFO +6 -6
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise.egg-info/SOURCES.txt +8 -8
- {orforise-1.6.1 → orforise-1.6.2}/LICENSE +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/setup.cfg +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Aux/StORF_Undetected/Completely_Undetected/Completey_Undetected.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Aux/StORF_Undetected/Completely_Undetected/__init__.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Aux/StORF_Undetected/StORF_Undetected.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Aux/StORF_Undetected/__init__.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Aux/StORF_Undetected/unvitiated_Genes/__init__.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Aux/StORF_Undetected/unvitiated_Genes/unvitiated_Missed_Genes.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Aux/TabToGFF/TabToGFF.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Aux/TabToGFF/__init__.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Aux/__init__.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/ORForise_Analysis/__init__.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/ORForise_Analysis/cds_checker.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/ORForise_Analysis/gene_Lenghts.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/ORForise_Analysis/genome_Metrics.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/ORForise_Analysis/hypothetical_gene_predictions.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/ORForise_Analysis/missed_Gene_Metrics.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/ORForise_Analysis/parital_Match_Analysis.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/ORForise_Analysis/result_File_Analysis.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/ORForise_Analysis/start_Codon_Substitution.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/Augustus/__init__.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/Balrog/__init__.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/EasyGene/EasyGene.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/EasyGene/__init__.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/FGENESB/__init__.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/FragGeneScan/__init__.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/GFF/__init__.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/GLIMMER3/__init__.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/GeneMark/__init__.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/GeneMarkHA/__init__.py +0 -0
- {orforise-1.6.1/src/ORForise/Tools/GeneMark_HMM → orforise-1.6.2/src/ORForise/Tools/GeneMarkHMM}/__init__.py +0 -0
- {orforise-1.6.1/src/ORForise/Tools/GeneMark_S → orforise-1.6.2/src/ORForise/Tools/GeneMarkS}/__init__.py +0 -0
- {orforise-1.6.1/src/ORForise/Tools/GeneMark_S_2 → orforise-1.6.2/src/ORForise/Tools/GeneMarkS2}/__init__.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/MetaGene/__init__.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/MetaGeneAnnotator/__init__.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/MetaGeneMark/__init__.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/Prodigal/__init__.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/Prokka/__init__.py +0 -0
- {orforise-1.6.1/src/ORForise/Tools/StORF_Reporter → orforise-1.6.2/src/ORForise/Tools/StORF-Reporter}/__init__.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/TransDecoder/__init__.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Tools/__init__.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/__init__.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise/utils.py +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise.egg-info/dependency_links.txt +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise.egg-info/entry_points.txt +0 -0
- {orforise-1.6.1 → orforise-1.6.2}/src/ORForise.egg-info/top_level.txt +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: ORForise
|
|
3
|
-
Version: 1.6.
|
|
3
|
+
Version: 1.6.2
|
|
4
4
|
Summary: ORForise - A platform for analysing and comparing genome annotations.
|
|
5
5
|
Author-email: Nicholas Dimonaco <nicholas@dimonaco.co.uk>
|
|
6
6
|
License: GNU GENERAL PUBLIC LICENSE
|
|
@@ -662,7 +662,7 @@ Example output files from ```Annotation-Compare```, ```Aggregate-Compare```, ```
|
|
|
662
662
|
For Help: ```Annotation-Compare -h ```
|
|
663
663
|
|
|
664
664
|
```python
|
|
665
|
-
ORForise v1.6.
|
|
665
|
+
ORForise v1.6.2: Annotatione-Compare Run Parameters.
|
|
666
666
|
|
|
667
667
|
Required Arguments:
|
|
668
668
|
-dna GENOME_DNA Genome DNA file (.fa) which both annotations are based on
|
|
@@ -730,7 +730,7 @@ ORForise can be used as the example below.
|
|
|
730
730
|
For Help: ```Aggregate-Compare -h ```
|
|
731
731
|
|
|
732
732
|
```python
|
|
733
|
-
ORForise v1.6.
|
|
733
|
+
ORForise v1.6.2: Aggregate-Compare Run Parameters.
|
|
734
734
|
|
|
735
735
|
Required Arguments:
|
|
736
736
|
-dna GENOME_DNA Genome DNA file (.fa) which both annotations are based on
|
|
@@ -811,7 +811,7 @@ GFF-Adder combines two existing annotations (GFF or other tool formats).
|
|
|
811
811
|
For Help: ```GFF-Adder -h ```
|
|
812
812
|
|
|
813
813
|
```python
|
|
814
|
-
ORForise v1.6.
|
|
814
|
+
ORForise v1.6.2: GFF-Adder Run Parameters.
|
|
815
815
|
|
|
816
816
|
Required Arguments:
|
|
817
817
|
-dna GENOME_DNA Genome DNA file (.fa) which both annotations are based on
|
|
@@ -868,7 +868,7 @@ usage: Annotation_Intersector.py [-h] -ref REFERENCE_ANNOTATION -at
|
|
|
868
868
|
[-cov COVERAGE] [--report-discordance]
|
|
869
869
|
[--report-discordance-file REPORT_DISCORDANCE_FILE]
|
|
870
870
|
|
|
871
|
-
ORForise v1.6.
|
|
871
|
+
ORForise v1.6.2: Annotation-Intersector Run Parameters
|
|
872
872
|
|
|
873
873
|
options:
|
|
874
874
|
-h, --help show this help message and exit
|
|
@@ -947,7 +947,7 @@ Please report any issues to: https://github.com/NickJD/ORForise/issues
|
|
|
947
947
|
#####
|
|
948
948
|
usage: Convert_To_GFF.py [-h] [-dna GENOME_DNA] -i INPUT_ANNOTATION -fmt FORMAT -o OUTPUT_DIR [-gi GENE_IDENT] [--verbose]
|
|
949
949
|
|
|
950
|
-
ORForise v1.6.
|
|
950
|
+
ORForise v1.6.2: Convert-To-GFF Run Parameters
|
|
951
951
|
|
|
952
952
|
Required Arguments:
|
|
953
953
|
-dna GENOME_DNA Genome DNA file (.fa)
|
|
@@ -21,7 +21,7 @@ Example output files from ```Annotation-Compare```, ```Aggregate-Compare```, ```
|
|
|
21
21
|
For Help: ```Annotation-Compare -h ```
|
|
22
22
|
|
|
23
23
|
```python
|
|
24
|
-
ORForise v1.6.
|
|
24
|
+
ORForise v1.6.2: Annotatione-Compare Run Parameters.
|
|
25
25
|
|
|
26
26
|
Required Arguments:
|
|
27
27
|
-dna GENOME_DNA Genome DNA file (.fa) which both annotations are based on
|
|
@@ -89,7 +89,7 @@ ORForise can be used as the example below.
|
|
|
89
89
|
For Help: ```Aggregate-Compare -h ```
|
|
90
90
|
|
|
91
91
|
```python
|
|
92
|
-
ORForise v1.6.
|
|
92
|
+
ORForise v1.6.2: Aggregate-Compare Run Parameters.
|
|
93
93
|
|
|
94
94
|
Required Arguments:
|
|
95
95
|
-dna GENOME_DNA Genome DNA file (.fa) which both annotations are based on
|
|
@@ -170,7 +170,7 @@ GFF-Adder combines two existing annotations (GFF or other tool formats).
|
|
|
170
170
|
For Help: ```GFF-Adder -h ```
|
|
171
171
|
|
|
172
172
|
```python
|
|
173
|
-
ORForise v1.6.
|
|
173
|
+
ORForise v1.6.2: GFF-Adder Run Parameters.
|
|
174
174
|
|
|
175
175
|
Required Arguments:
|
|
176
176
|
-dna GENOME_DNA Genome DNA file (.fa) which both annotations are based on
|
|
@@ -227,7 +227,7 @@ usage: Annotation_Intersector.py [-h] -ref REFERENCE_ANNOTATION -at
|
|
|
227
227
|
[-cov COVERAGE] [--report-discordance]
|
|
228
228
|
[--report-discordance-file REPORT_DISCORDANCE_FILE]
|
|
229
229
|
|
|
230
|
-
ORForise v1.6.
|
|
230
|
+
ORForise v1.6.2: Annotation-Intersector Run Parameters
|
|
231
231
|
|
|
232
232
|
options:
|
|
233
233
|
-h, --help show this help message and exit
|
|
@@ -306,7 +306,7 @@ Please report any issues to: https://github.com/NickJD/ORForise/issues
|
|
|
306
306
|
#####
|
|
307
307
|
usage: Convert_To_GFF.py [-h] [-dna GENOME_DNA] -i INPUT_ANNOTATION -fmt FORMAT -o OUTPUT_DIR [-gi GENE_IDENT] [--verbose]
|
|
308
308
|
|
|
309
|
-
ORForise v1.6.
|
|
309
|
+
ORForise v1.6.2: Convert-To-GFF Run Parameters
|
|
310
310
|
|
|
311
311
|
Required Arguments:
|
|
312
312
|
-dna GENOME_DNA Genome DNA file (.fa)
|
|
@@ -2,14 +2,12 @@ from importlib import import_module
|
|
|
2
2
|
import argparse
|
|
3
3
|
import csv, os, gzip, sys
|
|
4
4
|
|
|
5
|
-
|
|
6
5
|
try:
|
|
7
|
-
from Comparator import tool_comparison
|
|
8
|
-
from utils import *
|
|
9
|
-
except ImportError:
|
|
10
6
|
from .Comparator import tool_comparison
|
|
11
7
|
from .utils import *
|
|
12
|
-
|
|
8
|
+
except (ImportError, ModuleNotFoundError):
|
|
9
|
+
from Comparator import tool_comparison
|
|
10
|
+
from utils import *
|
|
13
11
|
############################################
|
|
14
12
|
|
|
15
13
|
def comparator(options):
|
|
@@ -7,11 +7,12 @@ from datetime import datetime
|
|
|
7
7
|
|
|
8
8
|
|
|
9
9
|
try:
|
|
10
|
-
from utils import *
|
|
11
|
-
from Comparator import tool_comparison
|
|
12
|
-
except ImportError:
|
|
13
10
|
from .Comparator import tool_comparison
|
|
14
11
|
from .utils import *
|
|
12
|
+
except (ImportError, ModuleNotFoundError):
|
|
13
|
+
from Comparator import tool_comparison
|
|
14
|
+
from utils import *
|
|
15
|
+
|
|
15
16
|
|
|
16
17
|
##########################
|
|
17
18
|
|
|
@@ -11,9 +11,9 @@ if not logging.getLogger().handlers:
|
|
|
11
11
|
logging.basicConfig(stream=sys.stdout, level=logging.INFO, format='%(levelname)s: %(message)s')
|
|
12
12
|
|
|
13
13
|
try:
|
|
14
|
-
from utils import *
|
|
15
|
-
except ImportError:
|
|
16
14
|
from .utils import *
|
|
15
|
+
except (ImportError, ModuleNotFoundError):
|
|
16
|
+
from utils import *
|
|
17
17
|
|
|
18
18
|
################################
|
|
19
19
|
|
|
@@ -5,11 +5,13 @@ import os
|
|
|
5
5
|
import sys
|
|
6
6
|
|
|
7
7
|
try:
|
|
8
|
+
from .utils import *
|
|
9
|
+
from .Aux.TabToGFF.TabToGFF import TabToGFF
|
|
10
|
+
except (ImportError, ModuleNotFoundError):
|
|
8
11
|
from utils import *
|
|
9
12
|
from ORForise.src.ORForise.Aux.TabToGFF import TabToGFF
|
|
10
|
-
|
|
11
|
-
|
|
12
|
-
from ORForise.Aux.TabToGFF.TabToGFF import TabToGFF
|
|
13
|
+
|
|
14
|
+
|
|
13
15
|
|
|
14
16
|
|
|
15
17
|
def setup_logging(outdir, verbose=False):
|
|
@@ -6,9 +6,9 @@ from datetime import date
|
|
|
6
6
|
import sys
|
|
7
7
|
|
|
8
8
|
try:
|
|
9
|
-
from utils import *
|
|
10
|
-
except ImportError:
|
|
11
9
|
from .utils import *
|
|
10
|
+
except (ImportError, ModuleNotFoundError):
|
|
11
|
+
from utils import *
|
|
12
12
|
|
|
13
13
|
|
|
14
14
|
########################################
|
|
@@ -370,7 +370,7 @@ def gff_adder(options):
|
|
|
370
370
|
|
|
371
371
|
else:
|
|
372
372
|
# Reference tool provided: attempt to call it with dna_regions first (multi-contig aware), fallback to legacy signature
|
|
373
|
-
reference_tool = options.reference_tool if options.reference_tool != '
|
|
373
|
+
reference_tool = options.reference_tool if options.reference_tool != 'StORF-Reporter' else 'StORF-Reporter'
|
|
374
374
|
try:
|
|
375
375
|
reference_tool_mod = import_module('Tools.' + reference_tool + '.' + reference_tool, package='my_current_pkg')
|
|
376
376
|
except ModuleNotFoundError:
|
|
@@ -1,17 +1,10 @@
|
|
|
1
1
|
from importlib import import_module
|
|
2
|
-
import
|
|
3
|
-
import sys, os
|
|
4
|
-
import gzip, csv
|
|
5
|
-
import logging
|
|
6
|
-
from datetime import datetime
|
|
7
|
-
|
|
2
|
+
import os
|
|
8
3
|
|
|
9
4
|
try:
|
|
10
|
-
from utils import *
|
|
11
|
-
from Comparator import tool_comparison
|
|
12
|
-
except ImportError:
|
|
13
|
-
from .Comparator import tool_comparison
|
|
14
5
|
from .utils import *
|
|
6
|
+
except (ImportError, ModuleNotFoundError):
|
|
7
|
+
from utils import *
|
|
15
8
|
|
|
16
9
|
|
|
17
10
|
|
|
@@ -3,11 +3,11 @@ import argparse
|
|
|
3
3
|
import csv
|
|
4
4
|
|
|
5
5
|
try:
|
|
6
|
-
from utils import *
|
|
7
|
-
from Comparator import tool_comparison
|
|
8
|
-
except ImportError:
|
|
9
6
|
from .Comparator import tool_comparison
|
|
10
7
|
from .utils import *
|
|
8
|
+
except (ImportError, ModuleNotFoundError):
|
|
9
|
+
from Comparator import tool_comparison
|
|
10
|
+
from utils import *
|
|
11
11
|
|
|
12
12
|
###################
|
|
13
13
|
|
|
@@ -11,11 +11,23 @@ except ImportError:
|
|
|
11
11
|
def Augustus(*args):
|
|
12
12
|
tool_pred = args[0]
|
|
13
13
|
dna_regions = args[1]
|
|
14
|
+
if not dna_regions: # This triggers if dna_regions is an empty dict (GFF_Intersect passed nothing)
|
|
15
|
+
dna_regions = collections.OrderedDict()
|
|
16
|
+
with open(tool_pred, 'r') as Augustus_input:
|
|
17
|
+
for line in Augustus_input:
|
|
18
|
+
line = line.split()
|
|
19
|
+
if len(line) == 10 and "CDS" in line[2] and line[0] not in dna_regions:
|
|
20
|
+
dna_regions[line[0]] = [] # Placeholder for genome sequence
|
|
21
|
+
return dna_regions
|
|
22
|
+
|
|
14
23
|
augustus_ORFs = collections.OrderedDict()
|
|
15
24
|
for dna_region in dna_regions:
|
|
16
25
|
augustus_ORFs[dna_region] = collections.OrderedDict()
|
|
17
26
|
for dna_region in dna_regions:
|
|
18
|
-
|
|
27
|
+
try:
|
|
28
|
+
genome = dna_regions[dna_region][0]
|
|
29
|
+
except IndexError:
|
|
30
|
+
genome = dna_regions[dna_region]
|
|
19
31
|
genome_size = len(genome)
|
|
20
32
|
genome_rev = revCompIterative(genome)
|
|
21
33
|
with open(tool_pred, 'r') as Augustus_input:
|
|
@@ -11,11 +11,23 @@ except ImportError:
|
|
|
11
11
|
def Balrog(*args):
|
|
12
12
|
tool_pred = args[0]
|
|
13
13
|
dna_regions = args[1]
|
|
14
|
+
if not dna_regions: # This triggers if dna_regions is an empty dict (GFF_Intersect passed nothing)
|
|
15
|
+
dna_regions = collections.OrderedDict()
|
|
16
|
+
with open(tool_pred, 'r') as Balrog_input:
|
|
17
|
+
for line in Balrog_input:
|
|
18
|
+
line = line.split()
|
|
19
|
+
if "CDS" in line[2] and line[0] not in dna_regions:
|
|
20
|
+
dna_regions[line[0]] = [] # Placeholder for genome sequence
|
|
21
|
+
return dna_regions
|
|
22
|
+
|
|
14
23
|
Balrog_ORFs = collections.OrderedDict()
|
|
15
24
|
for dna_region in dna_regions:
|
|
16
25
|
Balrog_ORFs[dna_region] = collections.OrderedDict()
|
|
17
26
|
for dna_region in dna_regions:
|
|
18
|
-
|
|
27
|
+
try:
|
|
28
|
+
genome = dna_regions[dna_region][0]
|
|
29
|
+
except IndexError:
|
|
30
|
+
genome = dna_regions[dna_region]
|
|
19
31
|
genome_size = len(genome)
|
|
20
32
|
genome_rev = revCompIterative(genome)
|
|
21
33
|
|
|
@@ -11,11 +11,23 @@ except ImportError:
|
|
|
11
11
|
def FGENESB(*args):
|
|
12
12
|
tool_pred = args[0]
|
|
13
13
|
dna_regions = args[1]
|
|
14
|
+
if not dna_regions: # This triggers if dna_regions is an empty dict (GFF_Intersect passed nothing)
|
|
15
|
+
dna_regions = collections.OrderedDict()
|
|
16
|
+
with open(tool_pred, 'r') as FGENESB_input:
|
|
17
|
+
for line in FGENESB_input:
|
|
18
|
+
line = line.split()
|
|
19
|
+
if len(line) == 10 and ">GENE" in line[0] and line[0] not in dna_regions:
|
|
20
|
+
dna_regions[line[0]] = [] # Placeholder for genome sequence
|
|
21
|
+
return dna_regions
|
|
22
|
+
|
|
14
23
|
FGENESB_ORFs = collections.OrderedDict()
|
|
15
24
|
for dna_region in dna_regions:
|
|
16
25
|
FGENESB_ORFs[dna_region] = collections.OrderedDict()
|
|
17
26
|
for dna_region in dna_regions:
|
|
18
|
-
|
|
27
|
+
try:
|
|
28
|
+
genome = dna_regions[dna_region][0]
|
|
29
|
+
except IndexError:
|
|
30
|
+
genome = dna_regions[dna_region]
|
|
19
31
|
genome_size = len(genome)
|
|
20
32
|
genome_rev = revCompIterative(genome)
|
|
21
33
|
with open(tool_pred, 'r') as FGENESB_input:
|
|
@@ -11,11 +11,23 @@ except ImportError:
|
|
|
11
11
|
def FragGeneScan(*args):
|
|
12
12
|
tool_pred = args[0]
|
|
13
13
|
dna_regions = args[1]
|
|
14
|
+
if not dna_regions: # This triggers if dna_regions is an empty dict (GFF_Intersect passed nothing)
|
|
15
|
+
dna_regions = collections.OrderedDict()
|
|
16
|
+
with open(tool_pred, 'r') as fragGeneScan_input:
|
|
17
|
+
for line in fragGeneScan_input:
|
|
18
|
+
line = line.split()
|
|
19
|
+
if len(line) == 10 and "FGS" in line[1] and "CDS" in line[2] and line[0] not in dna_regions:
|
|
20
|
+
dna_regions[line[0]] = [] # Placeholder for genome sequence
|
|
21
|
+
return dna_regions
|
|
22
|
+
|
|
14
23
|
fragGeneScan_ORFs = collections.OrderedDict()
|
|
15
24
|
for dna_region in dna_regions:
|
|
16
25
|
fragGeneScan_ORFs[dna_region] = collections.OrderedDict()
|
|
17
26
|
for dna_region in dna_regions:
|
|
18
|
-
|
|
27
|
+
try:
|
|
28
|
+
genome = dna_regions[dna_region][0]
|
|
29
|
+
except IndexError:
|
|
30
|
+
genome = dna_regions[dna_region]
|
|
19
31
|
genome_size = len(genome)
|
|
20
32
|
genome_rev = revCompIterative(genome)
|
|
21
33
|
with open(tool_pred, 'r') as fragGeneScan_input:
|
|
@@ -1,5 +1,4 @@
|
|
|
1
1
|
import collections
|
|
2
|
-
import sys
|
|
3
2
|
try:
|
|
4
3
|
from utils import revCompIterative
|
|
5
4
|
from utils import sortORFs
|
|
@@ -11,11 +10,23 @@ except ImportError:
|
|
|
11
10
|
def GFF(*args):
|
|
12
11
|
tool_pred = args[0]
|
|
13
12
|
dna_regions = args[1]
|
|
13
|
+
if not dna_regions: # This triggers if dna_regions is an empty dict (GFF_Intersect passed nothing)
|
|
14
|
+
dna_regions = collections.OrderedDict()
|
|
15
|
+
with open(tool_pred, 'r') as GFF_input:
|
|
16
|
+
for line in GFF_input:
|
|
17
|
+
line = line.split()
|
|
18
|
+
if 'CDS' in line[2] and len(line) == 9 and line[0] not in dna_regions:
|
|
19
|
+
dna_regions[line[0]] = [] # Placeholder for genome sequence
|
|
20
|
+
return dna_regions
|
|
21
|
+
|
|
14
22
|
GFF_ORFs = collections.OrderedDict()
|
|
15
23
|
for dna_region in dna_regions:
|
|
16
24
|
GFF_ORFs[dna_region] = collections.OrderedDict()
|
|
17
25
|
for dna_region in dna_regions:
|
|
18
|
-
|
|
26
|
+
try:
|
|
27
|
+
genome = dna_regions[dna_region][0]
|
|
28
|
+
except IndexError:
|
|
29
|
+
genome = dna_regions[dna_region]
|
|
19
30
|
genome_size = len(genome)
|
|
20
31
|
genome_rev = revCompIterative(genome)
|
|
21
32
|
with open(tool_pred, 'r') as gff_input:
|
|
@@ -11,11 +11,23 @@ except ImportError:
|
|
|
11
11
|
def GLIMMER_3(*args):
|
|
12
12
|
tool_pred = args[0]
|
|
13
13
|
dna_regions = args[1]
|
|
14
|
+
if not dna_regions: # This triggers if dna_regions is an empty dict (GFF_Intersect passed nothing)
|
|
15
|
+
dna_regions = collections.OrderedDict()
|
|
16
|
+
with open(tool_pred, 'r') as GLIMKMER_input:
|
|
17
|
+
for line in GLIMMER_input:
|
|
18
|
+
line = line.split()
|
|
19
|
+
if len(line) == 5 and "orf" in line[0] and line[0] not in dna_regions:
|
|
20
|
+
dna_regions[line[0]] = [] # Placeholder for genome sequence
|
|
21
|
+
return dna_regions
|
|
22
|
+
|
|
14
23
|
GLIMMER_ORFs = collections.OrderedDict()
|
|
15
24
|
for dna_region in dna_regions:
|
|
16
25
|
GLIMMER_ORFs[dna_region] = collections.OrderedDict()
|
|
17
26
|
for dna_region in dna_regions:
|
|
18
|
-
|
|
27
|
+
try:
|
|
28
|
+
genome = dna_regions[dna_region][0]
|
|
29
|
+
except IndexError:
|
|
30
|
+
genome = dna_regions[dna_region]
|
|
19
31
|
genome_size = len(genome)
|
|
20
32
|
genome_rev = revCompIterative(genome)
|
|
21
33
|
with open(tool_pred,
|
|
@@ -10,11 +10,23 @@ except ImportError:
|
|
|
10
10
|
def GeneMark(*args):
|
|
11
11
|
tool_pred = args[0]
|
|
12
12
|
dna_regions = args[1]
|
|
13
|
+
if not dna_regions: # This triggers if dna_regions is an empty dict (GFF_Intersect passed nothing)
|
|
14
|
+
dna_regions = collections.OrderedDict()
|
|
15
|
+
with open(tool_pred, 'r') as GeneMark_input:
|
|
16
|
+
for line in GeneMark_input:
|
|
17
|
+
line = line.split()
|
|
18
|
+
if 'direct' in line[2] or 'complement' in line[2] and line[0] not in dna_regions:
|
|
19
|
+
dna_regions[line[0]] = [] # Placeholder for genome sequence
|
|
20
|
+
return dna_regions
|
|
21
|
+
|
|
13
22
|
geneMark_ORFs = collections.OrderedDict()
|
|
14
23
|
for dna_region in dna_regions:
|
|
15
24
|
geneMark_ORFs[dna_region] = collections.OrderedDict()
|
|
16
25
|
for dna_region in dna_regions:
|
|
17
|
-
|
|
26
|
+
try:
|
|
27
|
+
genome = dna_regions[dna_region][0]
|
|
28
|
+
except IndexError:
|
|
29
|
+
genome = dna_regions[dna_region]
|
|
18
30
|
genome_size = len(genome)
|
|
19
31
|
genome_rev = revCompIterative(genome)
|
|
20
32
|
prev_Start = 0
|
|
@@ -11,15 +11,27 @@ except ImportError:
|
|
|
11
11
|
def GeneMark_HA(*args):
|
|
12
12
|
tool_pred = args[0]
|
|
13
13
|
dna_regions = args[1]
|
|
14
|
-
|
|
14
|
+
if not dna_regions: # This triggers if dna_regions is an empty dict (GFF_Intersect passed nothing)
|
|
15
|
+
dna_regions = collections.OrderedDict()
|
|
16
|
+
with open(tool_pred, 'r') as GeneMarkHA_input:
|
|
17
|
+
for line in GeneMarkHA_input:
|
|
18
|
+
line = line.split()
|
|
19
|
+
if len(line) >= 9 and "CDS" in line[5] and line[0] not in dna_regions:
|
|
20
|
+
dna_regions[line[0]] = [] # Placeholder for genome sequence
|
|
21
|
+
return dna_regions
|
|
22
|
+
|
|
23
|
+
geneMarkHA_ORFs = collections.OrderedDict()
|
|
15
24
|
for dna_region in dna_regions:
|
|
16
|
-
|
|
25
|
+
geneMarkHA_ORFs[dna_region] = collections.OrderedDict()
|
|
17
26
|
for dna_region in dna_regions:
|
|
18
|
-
|
|
27
|
+
try:
|
|
28
|
+
genome = dna_regions[dna_region][0]
|
|
29
|
+
except IndexError:
|
|
30
|
+
genome = dna_regions[dna_region]
|
|
19
31
|
genome_size = len(genome)
|
|
20
32
|
genome_rev = revCompIterative(genome)
|
|
21
|
-
with open(tool_pred, 'r') as
|
|
22
|
-
for line in
|
|
33
|
+
with open(tool_pred, 'r') as GeneMarkHA_input:
|
|
34
|
+
for line in GeneMarkHA_input:
|
|
23
35
|
line = line.split()
|
|
24
36
|
if len(line) >= 9 and "CDS" in line[5] and dna_region in line[0]:
|
|
25
37
|
start = int(line[6])
|
|
@@ -35,8 +47,8 @@ def GeneMark_HA(*args):
|
|
|
35
47
|
stopCodon = genome[stop - 3:stop]
|
|
36
48
|
po = str(start) + ',' + str(stop)
|
|
37
49
|
orf = [strand, startCodon, stopCodon, 'CDS', 'GeneMarkHA']
|
|
38
|
-
|
|
50
|
+
geneMarkHA_ORFs.update({po: orf})
|
|
39
51
|
|
|
40
|
-
for group in
|
|
41
|
-
|
|
42
|
-
return
|
|
52
|
+
for group in geneMarkHA_ORFs:
|
|
53
|
+
geneMarkHA_ORFs[group] = sortORFs(geneMarkHA_ORFs[group])
|
|
54
|
+
return geneMarkHA_ORFs
|
|
@@ -12,15 +12,27 @@ except ImportError:
|
|
|
12
12
|
def GeneMark_HMM(*args):
|
|
13
13
|
tool_pred = args[0]
|
|
14
14
|
dna_regions = args[1]
|
|
15
|
-
|
|
15
|
+
if not dna_regions: # This triggers if dna_regions is an empty dict (GFF_Intersect passed nothing)
|
|
16
|
+
dna_regions = collections.OrderedDict()
|
|
17
|
+
with open(tool_pred, 'r') as GeneMarkHMM_input:
|
|
18
|
+
for line in GeneMarkHMM_input:
|
|
19
|
+
line = line.split()
|
|
20
|
+
if len(line) >= 9 and "CDS" in line[2] and line[0] not in dna_regions:
|
|
21
|
+
dna_regions[line[0]] = [] # Placeholder for genome sequence
|
|
22
|
+
return dna_regions
|
|
23
|
+
|
|
24
|
+
geneMarkHMM_ORFs = collections.OrderedDict()
|
|
16
25
|
for dna_region in dna_regions:
|
|
17
|
-
|
|
26
|
+
geneMarkHMM_ORFs[dna_region] = collections.OrderedDict()
|
|
18
27
|
for dna_region in dna_regions:
|
|
19
|
-
|
|
28
|
+
try:
|
|
29
|
+
genome = dna_regions[dna_region][0]
|
|
30
|
+
except IndexError:
|
|
31
|
+
genome = dna_regions[dna_region]
|
|
20
32
|
genome_size = len(genome)
|
|
21
33
|
genome_rev = revCompIterative(genome)
|
|
22
|
-
with open(tool_pred, 'r') as
|
|
23
|
-
for line in
|
|
34
|
+
with open(tool_pred, 'r') as GeneMarkHMM_input:
|
|
35
|
+
for line in GeneMarkHMM_input:
|
|
24
36
|
line = line.split('\t')
|
|
25
37
|
if len(line) >= 9 and "CDS" in line[2] and dna_region in line[0]:
|
|
26
38
|
start = int(line[3])
|
|
@@ -35,9 +47,9 @@ def GeneMark_HMM(*args):
|
|
|
35
47
|
startCodon = genome[start - 1:start + 2]
|
|
36
48
|
stopCodon = genome[stop - 3:stop]
|
|
37
49
|
po = str(start) + ',' + str(stop)
|
|
38
|
-
orf = [strand, startCodon, stopCodon, 'CDS', '
|
|
39
|
-
|
|
50
|
+
orf = [strand, startCodon, stopCodon, 'CDS', 'GeneMarkHMM']
|
|
51
|
+
geneMarkHMM_ORFs.update({po: orf})
|
|
40
52
|
|
|
41
|
-
for group in
|
|
42
|
-
|
|
43
|
-
return
|
|
53
|
+
for group in geneMarkHMM_ORFs:
|
|
54
|
+
geneMarkHMM_ORFs[group] = sortORFs(geneMarkHMM_ORFs[group])
|
|
55
|
+
return geneMarkHMM_ORFs
|
|
@@ -11,15 +11,27 @@ except ImportError:
|
|
|
11
11
|
def GeneMark_S(*args):
|
|
12
12
|
tool_pred = args[0]
|
|
13
13
|
dna_regions = args[1]
|
|
14
|
-
|
|
14
|
+
if not dna_regions: # This triggers if dna_regions is an empty dict (GFF_Intersect passed nothing)
|
|
15
|
+
dna_regions = collections.OrderedDict()
|
|
16
|
+
with open(tool_pred, 'r') as GeneMarkS_input:
|
|
17
|
+
for line in GeneMarkS_input:
|
|
18
|
+
line = line.split()
|
|
19
|
+
if len(line) >= 9 and "CDS" in line[5] and line[0] not in dna_regions:
|
|
20
|
+
dna_regions[line[0]] = [] # Placeholder for genome sequence
|
|
21
|
+
return dna_regions
|
|
22
|
+
|
|
23
|
+
geneMarkS_ORFs = collections.OrderedDict()
|
|
15
24
|
for dna_region in dna_regions:
|
|
16
|
-
|
|
25
|
+
geneMarkS_ORFs[dna_region] = collections.OrderedDict()
|
|
17
26
|
for dna_region in dna_regions:
|
|
18
|
-
|
|
27
|
+
try:
|
|
28
|
+
genome = dna_regions[dna_region][0]
|
|
29
|
+
except IndexError:
|
|
30
|
+
genome = dna_regions[dna_region]
|
|
19
31
|
genome_size = len(genome)
|
|
20
32
|
genome_rev = revCompIterative(genome)
|
|
21
|
-
with open(tool_pred, 'r') as
|
|
22
|
-
for line in
|
|
33
|
+
with open(tool_pred, 'r') as GeneMarkS_input:
|
|
34
|
+
for line in GeneMarkS_input:
|
|
23
35
|
line = line.split()
|
|
24
36
|
if len(line) >= 9 and "CDS" in line[5] and dna_region in line[0]:
|
|
25
37
|
start = int(line[6])
|
|
@@ -34,9 +46,9 @@ def GeneMark_S(*args):
|
|
|
34
46
|
startCodon = genome[start - 1:start + 2]
|
|
35
47
|
stopCodon = genome[stop - 3:stop]
|
|
36
48
|
po = str(start) + ',' + str(stop)
|
|
37
|
-
orf = [strand, startCodon, stopCodon, 'CDS', '
|
|
38
|
-
|
|
49
|
+
orf = [strand, startCodon, stopCodon, 'CDS', 'GeneMarkS']
|
|
50
|
+
geneMarkS_ORFs.update({po: orf})
|
|
39
51
|
|
|
40
|
-
for group in
|
|
41
|
-
|
|
42
|
-
return
|
|
52
|
+
for group in geneMarkS_ORFs:
|
|
53
|
+
geneMarkS_ORFs[group] = sortORFs(geneMarkS_ORFs[group])
|
|
54
|
+
return geneMarkS_ORFs
|
|
@@ -8,18 +8,30 @@ except ImportError:
|
|
|
8
8
|
from ORForise.utils import sortORFs
|
|
9
9
|
|
|
10
10
|
|
|
11
|
-
def
|
|
11
|
+
def GeneMarkS2(*args):
|
|
12
12
|
tool_pred = args[0]
|
|
13
13
|
dna_regions = args[1]
|
|
14
|
-
|
|
14
|
+
if not dna_regions: # This triggers if dna_regions is an empty dict (GFF_Intersect passed nothing)
|
|
15
|
+
dna_regions = collections.OrderedDict()
|
|
16
|
+
with open(tool_pred, 'r') as GeneMarkS2_input:
|
|
17
|
+
for line in GeneMarkS2_input:
|
|
18
|
+
line = line.split()
|
|
19
|
+
if len(line) >= 9 and "CDS" in line[2] and line[0] not in dna_regions:
|
|
20
|
+
dna_regions[line[0]] = [] # Placeholder for genome sequence
|
|
21
|
+
return dna_regions
|
|
22
|
+
|
|
23
|
+
geneMarkS2_ORFs = collections.defaultdict()
|
|
15
24
|
for dna_region in dna_regions:
|
|
16
|
-
|
|
25
|
+
geneMarkS2_ORFs[dna_region] = collections.OrderedDict()
|
|
17
26
|
for dna_region in dna_regions:
|
|
18
|
-
|
|
27
|
+
try:
|
|
28
|
+
genome = dna_regions[dna_region][0]
|
|
29
|
+
except IndexError:
|
|
30
|
+
genome = dna_regions[dna_region]
|
|
19
31
|
genome_size = len(genome)
|
|
20
32
|
genome_rev = revCompIterative(genome)
|
|
21
|
-
with open(tool_pred, 'r') as
|
|
22
|
-
for line in
|
|
33
|
+
with open(tool_pred, 'r') as GeneMarkS2_input:
|
|
34
|
+
for line in GeneMarkS2_input:
|
|
23
35
|
line = line.split('\t')
|
|
24
36
|
if len(line) >= 9 and dna_region in line[0] and "CDS" in line[2]:
|
|
25
37
|
start = int(line[3])
|
|
@@ -35,9 +47,9 @@ def GeneMark_S_2(*args):
|
|
|
35
47
|
startCodon = genome[start - 1:start + 2]
|
|
36
48
|
stopCodon = genome[stop - 3:stop]
|
|
37
49
|
po = str(start) + ',' + str(stop)
|
|
38
|
-
orf = [strand, startCodon, stopCodon, 'CDS', '
|
|
39
|
-
|
|
50
|
+
orf = [strand, startCodon, stopCodon, 'CDS', 'GeneMarkS2']
|
|
51
|
+
geneMarkS2_ORFs[dna_region].update({po: orf})
|
|
40
52
|
|
|
41
|
-
for group in
|
|
42
|
-
|
|
43
|
-
return
|
|
53
|
+
for group in geneMarkS2_ORFs:
|
|
54
|
+
geneMarkS2_ORFs[group] = sortORFs(geneMarkS2_ORFs[group])
|
|
55
|
+
return geneMarkS2_ORFs
|
|
@@ -11,11 +11,23 @@ except ImportError:
|
|
|
11
11
|
def MetaGene(*args):
|
|
12
12
|
tool_pred = args[0]
|
|
13
13
|
dna_regions = args[1]
|
|
14
|
+
if not dna_regions: # This triggers if dna_regions is an empty dict (GFF_Intersect passed nothing)
|
|
15
|
+
dna_regions = collections.OrderedDict()
|
|
16
|
+
with open(tool_pred, 'r') as MetaGene_input:
|
|
17
|
+
for line in MetaGene_input:
|
|
18
|
+
line = line.split()
|
|
19
|
+
if len(line) >= 6 and ("-" in line or '+' in line) and line[0] not in dna_regions:
|
|
20
|
+
dna_regions[line[0]] = [] # Placeholder for genome sequence
|
|
21
|
+
return dna_regions
|
|
22
|
+
|
|
14
23
|
metaGene_ORFs = collections.OrderedDict()
|
|
15
24
|
for dna_region in dna_regions:
|
|
16
25
|
metaGene_ORFs[dna_region] = collections.OrderedDict()
|
|
17
26
|
for dna_region in dna_regions:
|
|
18
|
-
|
|
27
|
+
try:
|
|
28
|
+
genome = dna_regions[dna_region][0]
|
|
29
|
+
except IndexError:
|
|
30
|
+
genome = dna_regions[dna_region]
|
|
19
31
|
genome_size = len(genome)
|
|
20
32
|
genome_rev = revCompIterative(genome)
|
|
21
33
|
with open(tool_pred, 'r') as MetaGene_input:
|
|
@@ -11,11 +11,23 @@ except ImportError:
|
|
|
11
11
|
def MetaGeneAnnotator(*args):
|
|
12
12
|
tool_pred = args[0]
|
|
13
13
|
dna_regions = args[1]
|
|
14
|
+
if not dna_regions: # This triggers if dna_regions is an empty dict (GFF_Intersect passed nothing)
|
|
15
|
+
dna_regions = collections.OrderedDict()
|
|
16
|
+
with open(tool_pred, 'r') as MetaGeneAnnotator_input:
|
|
17
|
+
for line in MetaGeneAnnotator_input:
|
|
18
|
+
line = line.split()
|
|
19
|
+
if len(line) == 11 and line[0] not in dna_regions:
|
|
20
|
+
dna_regions[line[0]] = [] # Placeholder for genome sequence
|
|
21
|
+
return dna_regions
|
|
22
|
+
|
|
14
23
|
metaGeneAnnotator_ORFs = collections.OrderedDict()
|
|
15
24
|
for dna_region in dna_regions:
|
|
16
25
|
metaGeneAnnotator_ORFs[dna_region] = collections.OrderedDict()
|
|
17
26
|
for dna_region in dna_regions:
|
|
18
|
-
|
|
27
|
+
try:
|
|
28
|
+
genome = dna_regions[dna_region][0]
|
|
29
|
+
except IndexError:
|
|
30
|
+
genome = dna_regions[dna_region]
|
|
19
31
|
genome_size = len(genome)
|
|
20
32
|
genome_rev = revCompIterative(genome)
|
|
21
33
|
with open(tool_pred, 'r') as MetaGeneAnnotator_input:
|
|
@@ -11,11 +11,23 @@ except ImportError:
|
|
|
11
11
|
def MetaGeneMark(*args):
|
|
12
12
|
tool_pred = args[0]
|
|
13
13
|
dna_regions = args[1]
|
|
14
|
+
if not dna_regions: # This triggers if dna_regions is an empty dict (GFF_Intersect passed nothing)
|
|
15
|
+
dna_regions = collections.OrderedDict()
|
|
16
|
+
with open(tool_pred, 'r') as MetaGeneMark_input:
|
|
17
|
+
for line in MetaGeneMark_input:
|
|
18
|
+
line = line.split()
|
|
19
|
+
if 'GeneMark.hmm' in line[4] and "CDS" in line[5] and line[0] not in dna_regions:
|
|
20
|
+
dna_regions[line[0]] = [] # Placeholder for genome sequence
|
|
21
|
+
return dna_regions
|
|
22
|
+
|
|
14
23
|
metaGeneMarkORFs = collections.OrderedDict()
|
|
15
24
|
for dna_region in dna_regions:
|
|
16
25
|
metaGeneMarkORFs[dna_region] = collections.OrderedDict()
|
|
17
26
|
for dna_region in dna_regions:
|
|
18
|
-
|
|
27
|
+
try:
|
|
28
|
+
genome = dna_regions[dna_region][0]
|
|
29
|
+
except IndexError:
|
|
30
|
+
genome = dna_regions[dna_region]
|
|
19
31
|
genome_size = len(genome)
|
|
20
32
|
genome_rev = revCompIterative(genome)
|
|
21
33
|
with open(tool_pred, 'r') as metaGeneMark_input:
|
|
@@ -13,10 +13,10 @@ def Prodigal(*args):
|
|
|
13
13
|
dna_regions = args[1]
|
|
14
14
|
if not dna_regions: # This triggers if dna_regions is an empty dict (GFF_Intersect passed nothing)
|
|
15
15
|
dna_regions = collections.OrderedDict()
|
|
16
|
-
with open(tool_pred, 'r') as
|
|
17
|
-
for line in
|
|
16
|
+
with open(tool_pred, 'r') as Prodigal_input:
|
|
17
|
+
for line in Prodigal_input:
|
|
18
18
|
line = line.split()
|
|
19
|
-
if
|
|
19
|
+
if "Prodigal" in line[1] and "CDS" in line[2] and line[0] not in dna_regions:
|
|
20
20
|
dna_regions[line[0]] = [] # Placeholder for genome sequence
|
|
21
21
|
return dna_regions
|
|
22
22
|
|
|
@@ -8,15 +8,27 @@ except ImportError:
|
|
|
8
8
|
from ORForise.utils import sortORFs
|
|
9
9
|
|
|
10
10
|
|
|
11
|
-
def Prokka(*args):
|
|
11
|
+
def Prokka(*args): # UNFINISHED
|
|
12
12
|
tool_pred = args[0]
|
|
13
13
|
dna_regions = args[1]
|
|
14
14
|
types = args[2]
|
|
15
|
+
if not dna_regions: # This triggers if dna_regions is an empty dict (GFF_Intersect passed nothing)
|
|
16
|
+
dna_regions = collections.OrderedDict()
|
|
17
|
+
with open(tool_pred, 'r') as PROKKA_input:
|
|
18
|
+
for line in PROKKA_input:
|
|
19
|
+
line = line.split()
|
|
20
|
+
if "Prodigal" in line[1] and "CDS" in line[2] and line[0] not in dna_regions:
|
|
21
|
+
dna_regions[line[0]] = [] # Placeholder for genome sequence
|
|
22
|
+
return dna_regions
|
|
23
|
+
|
|
15
24
|
prokkaORFs = collections.defaultdict(list)
|
|
16
25
|
for dna_region in dna_regions:
|
|
17
26
|
prokkaORFs[dna_region] = collections.OrderedDict()
|
|
18
27
|
for dna_region in dna_regions:
|
|
19
|
-
|
|
28
|
+
try:
|
|
29
|
+
genome = dna_regions[dna_region][0]
|
|
30
|
+
except IndexError:
|
|
31
|
+
genome = dna_regions[dna_region]
|
|
20
32
|
genome_size = len(genome)
|
|
21
33
|
genome_rev = revCompIterative(genome)
|
|
22
34
|
with open(tool_pred, 'r') as prodigal_input:
|
|
@@ -11,18 +11,30 @@ except ImportError:
|
|
|
11
11
|
def StORF_Reporter(*args):
|
|
12
12
|
tool_pred = args[0]
|
|
13
13
|
dna_regions = args[1]
|
|
14
|
+
if not dna_regions: # This triggers if dna_regions is an empty dict (GFF_Intersect passed nothing)
|
|
15
|
+
dna_regions = collections.OrderedDict()
|
|
16
|
+
with open(tool_pred, 'r') as StORF-Reporter_input:
|
|
17
|
+
for line in StORF-Reporter_input:
|
|
18
|
+
line = line.split()
|
|
19
|
+
if 'StORF-Reporter' in line[1] or 'StoRF_Reporter' in line[1] or 'StORF' in line[1] or 'StORF-Reporter' in line[1] and line[0] not in dna_regions:
|
|
20
|
+
dna_regions[line[0]] = [] # Placeholder for genome sequence
|
|
21
|
+
return dna_regions
|
|
22
|
+
|
|
14
23
|
storf_ORFs = collections.OrderedDict()
|
|
15
24
|
for dna_region in dna_regions:
|
|
16
25
|
storf_ORFs[dna_region] = collections.OrderedDict()
|
|
17
26
|
for dna_region in dna_regions:
|
|
18
|
-
|
|
27
|
+
try:
|
|
28
|
+
genome = dna_regions[dna_region][0]
|
|
29
|
+
except IndexError:
|
|
30
|
+
genome = dna_regions[dna_region]
|
|
19
31
|
genome_size = len(genome)
|
|
20
32
|
genome_rev = revCompIterative(genome)
|
|
21
33
|
with open(tool_pred, 'r') as storf_input:
|
|
22
34
|
for line in storf_input:
|
|
23
35
|
if not line.startswith('#') and not line.startswith('\n'):
|
|
24
36
|
line = line.split()
|
|
25
|
-
if '
|
|
37
|
+
if 'StORF-Reporter' in line[1] or 'StoRF_Reporter' in line[1] or 'StORF' in line[1] or 'StORF-Reporter' in line[1] and dna_region in line[0]: # need to harmonise this.
|
|
26
38
|
start = int(line[3])
|
|
27
39
|
stop = int(line[4])
|
|
28
40
|
strand = line[6]
|
|
@@ -11,11 +11,23 @@ except ImportError:
|
|
|
11
11
|
def TransDecoder(*args):
|
|
12
12
|
tool_pred = args[0]
|
|
13
13
|
dna_regions = args[1]
|
|
14
|
+
if not dna_regions: # This triggers if dna_regions is an empty dict (GFF_Intersect passed nothing)
|
|
15
|
+
dna_regions = collections.OrderedDict()
|
|
16
|
+
with open(tool_pred, 'r') as TransDecoder_input:
|
|
17
|
+
for line in TransDecoder_input:
|
|
18
|
+
line = line.split()
|
|
19
|
+
if len(line) == 9 and "transdecoder" in line[1] and "CDS" in line[2] and line[0] not in dna_regions:
|
|
20
|
+
dna_regions[line[0]] = [] # Placeholder for genome sequence
|
|
21
|
+
return dna_regions
|
|
22
|
+
|
|
14
23
|
transDecoder_ORFs = collections.OrderedDict()
|
|
15
24
|
for dna_region in dna_regions:
|
|
16
25
|
transDecoder_ORFs[dna_region] = collections.OrderedDict()
|
|
17
26
|
for dna_region in dna_regions:
|
|
18
|
-
|
|
27
|
+
try:
|
|
28
|
+
genome = dna_regions[dna_region][0]
|
|
29
|
+
except IndexError:
|
|
30
|
+
genome = dna_regions[dna_region]
|
|
19
31
|
genome_size = len(genome)
|
|
20
32
|
genome_rev = revCompIterative(genome)
|
|
21
33
|
with open(tool_pred, 'r') as transDecoder_Input:
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: ORForise
|
|
3
|
-
Version: 1.6.
|
|
3
|
+
Version: 1.6.2
|
|
4
4
|
Summary: ORForise - A platform for analysing and comparing genome annotations.
|
|
5
5
|
Author-email: Nicholas Dimonaco <nicholas@dimonaco.co.uk>
|
|
6
6
|
License: GNU GENERAL PUBLIC LICENSE
|
|
@@ -662,7 +662,7 @@ Example output files from ```Annotation-Compare```, ```Aggregate-Compare```, ```
|
|
|
662
662
|
For Help: ```Annotation-Compare -h ```
|
|
663
663
|
|
|
664
664
|
```python
|
|
665
|
-
ORForise v1.6.
|
|
665
|
+
ORForise v1.6.2: Annotatione-Compare Run Parameters.
|
|
666
666
|
|
|
667
667
|
Required Arguments:
|
|
668
668
|
-dna GENOME_DNA Genome DNA file (.fa) which both annotations are based on
|
|
@@ -730,7 +730,7 @@ ORForise can be used as the example below.
|
|
|
730
730
|
For Help: ```Aggregate-Compare -h ```
|
|
731
731
|
|
|
732
732
|
```python
|
|
733
|
-
ORForise v1.6.
|
|
733
|
+
ORForise v1.6.2: Aggregate-Compare Run Parameters.
|
|
734
734
|
|
|
735
735
|
Required Arguments:
|
|
736
736
|
-dna GENOME_DNA Genome DNA file (.fa) which both annotations are based on
|
|
@@ -811,7 +811,7 @@ GFF-Adder combines two existing annotations (GFF or other tool formats).
|
|
|
811
811
|
For Help: ```GFF-Adder -h ```
|
|
812
812
|
|
|
813
813
|
```python
|
|
814
|
-
ORForise v1.6.
|
|
814
|
+
ORForise v1.6.2: GFF-Adder Run Parameters.
|
|
815
815
|
|
|
816
816
|
Required Arguments:
|
|
817
817
|
-dna GENOME_DNA Genome DNA file (.fa) which both annotations are based on
|
|
@@ -868,7 +868,7 @@ usage: Annotation_Intersector.py [-h] -ref REFERENCE_ANNOTATION -at
|
|
|
868
868
|
[-cov COVERAGE] [--report-discordance]
|
|
869
869
|
[--report-discordance-file REPORT_DISCORDANCE_FILE]
|
|
870
870
|
|
|
871
|
-
ORForise v1.6.
|
|
871
|
+
ORForise v1.6.2: Annotation-Intersector Run Parameters
|
|
872
872
|
|
|
873
873
|
options:
|
|
874
874
|
-h, --help show this help message and exit
|
|
@@ -947,7 +947,7 @@ Please report any issues to: https://github.com/NickJD/ORForise/issues
|
|
|
947
947
|
#####
|
|
948
948
|
usage: Convert_To_GFF.py [-h] [-dna GENOME_DNA] -i INPUT_ANNOTATION -fmt FORMAT -o OUTPUT_DIR [-gi GENE_IDENT] [--verbose]
|
|
949
949
|
|
|
950
|
-
ORForise v1.6.
|
|
950
|
+
ORForise v1.6.2: Convert-To-GFF Run Parameters
|
|
951
951
|
|
|
952
952
|
Required Arguments:
|
|
953
953
|
-dna GENOME_DNA Genome DNA file (.fa)
|
|
@@ -53,12 +53,12 @@ src/ORForise/Tools/GeneMark/GeneMark.py
|
|
|
53
53
|
src/ORForise/Tools/GeneMark/__init__.py
|
|
54
54
|
src/ORForise/Tools/GeneMarkHA/GeneMarkHA.py
|
|
55
55
|
src/ORForise/Tools/GeneMarkHA/__init__.py
|
|
56
|
-
src/ORForise/Tools/
|
|
57
|
-
src/ORForise/Tools/
|
|
58
|
-
src/ORForise/Tools/
|
|
59
|
-
src/ORForise/Tools/
|
|
60
|
-
src/ORForise/Tools/
|
|
61
|
-
src/ORForise/Tools/
|
|
56
|
+
src/ORForise/Tools/GeneMarkHMM/GeneMarkHMM.py
|
|
57
|
+
src/ORForise/Tools/GeneMarkHMM/__init__.py
|
|
58
|
+
src/ORForise/Tools/GeneMarkS/GeneMarkS.py
|
|
59
|
+
src/ORForise/Tools/GeneMarkS/__init__.py
|
|
60
|
+
src/ORForise/Tools/GeneMarkS2/GeneMarkS2.py
|
|
61
|
+
src/ORForise/Tools/GeneMarkS2/__init__.py
|
|
62
62
|
src/ORForise/Tools/MetaGene/MetaGene.py
|
|
63
63
|
src/ORForise/Tools/MetaGene/__init__.py
|
|
64
64
|
src/ORForise/Tools/MetaGeneAnnotator/MetaGeneAnnotator.py
|
|
@@ -69,7 +69,7 @@ src/ORForise/Tools/Prodigal/Prodigal.py
|
|
|
69
69
|
src/ORForise/Tools/Prodigal/__init__.py
|
|
70
70
|
src/ORForise/Tools/Prokka/Prokka.py
|
|
71
71
|
src/ORForise/Tools/Prokka/__init__.py
|
|
72
|
-
src/ORForise/Tools/
|
|
73
|
-
src/ORForise/Tools/
|
|
72
|
+
src/ORForise/Tools/StORF-Reporter/StORF-Reporter.py
|
|
73
|
+
src/ORForise/Tools/StORF-Reporter/__init__.py
|
|
74
74
|
src/ORForise/Tools/TransDecoder/TransDecoder.py
|
|
75
75
|
src/ORForise/Tools/TransDecoder/__init__.py
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{orforise-1.6.1 → orforise-1.6.2}/src/ORForise/Aux/StORF_Undetected/unvitiated_Genes/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{orforise-1.6.1 → orforise-1.6.2}/src/ORForise/ORForise_Analysis/hypothetical_gene_predictions.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{orforise-1.6.1 → orforise-1.6.2}/src/ORForise/ORForise_Analysis/start_Codon_Substitution.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|