mgnify-pipelines-toolkit 1.1.2__tar.gz → 1.2.0__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of mgnify-pipelines-toolkit might be problematic. Click here for more details.
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/PKG-INFO +6 -6
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/assembly/antismash_gff_builder.py +24 -27
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit.egg-info/PKG-INFO +6 -6
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit.egg-info/requires.txt +1 -1
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/pyproject.toml +3 -3
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/LICENSE +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/README.md +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/__init__.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/__init__.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/amplicon/amplicon_utils.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/amplicon/are_there_primers.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/amplicon/assess_inflection_point_mcp.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/amplicon/assess_mcp_proportions.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/amplicon/classify_var_regions.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/amplicon/find_mcp_inflection_points.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/amplicon/make_asv_count_table.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/amplicon/mapseq_to_asv_table.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/amplicon/primer_val_classification.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/amplicon/remove_ambiguous_reads.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/amplicon/rev_comp_se_primers.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/amplicon/standard_primer_matching.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/amplicon/study_summary_generator.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/assembly/add_rhea_chebi_annotation.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/assembly/combined_gene_caller_merge.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/assembly/generate_gaf.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/assembly/gff_annotation_utils.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/assembly/gff_file_utils.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/assembly/gff_toolkit.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/assembly/go_utils.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/assembly/krona_txt_from_cat_classification.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/assembly/process_dbcan_result_cazys.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/assembly/process_dbcan_result_clusters.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/assembly/study_summary_generator.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/assembly/summarise_antismash_bgcs.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/assembly/summarise_goslims.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/assembly/summarise_sanntis_bgcs.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/genomes/__init__.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/shared/__init__.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/shared/convert_cmscan_to_cmsearch_tblout.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/shared/dwc_summary_generator.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/shared/fastq_suffix_header_check.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/shared/get_subunits.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/shared/get_subunits_coords.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/shared/library_strategy_check.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/shared/mapseq2biom.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/analysis/shared/markergene_study_summary.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/constants/db_labels.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/constants/ncrna.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/constants/regex_ambiguous_bases.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/constants/regex_fasta_header.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/constants/tax_ranks.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/constants/thresholds.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/constants/var_region_coordinates.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/schemas/schemas.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/utils/__init__.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/utils/fasta_to_delimited.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit/utils/get_mpt_version.py +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit.egg-info/SOURCES.txt +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit.egg-info/dependency_links.txt +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit.egg-info/entry_points.txt +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/mgnify_pipelines_toolkit.egg-info/top_level.txt +0 -0
- {mgnify_pipelines_toolkit-1.1.2 → mgnify_pipelines_toolkit-1.2.0}/setup.cfg +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: mgnify_pipelines_toolkit
|
|
3
|
-
Version: 1.1.2
|
|
3
|
+
Version: 1.2.0
|
|
4
4
|
Summary: Collection of scripts and tools for MGnify pipelines
|
|
5
5
|
Author-email: MGnify team <metagenomics-help@ebi.ac.uk>
|
|
6
6
|
License: Apache Software License 2.0
|
|
@@ -8,7 +8,7 @@ Keywords: bioinformatics,pipelines,metagenomics
|
|
|
8
8
|
Classifier: Programming Language :: Python :: 3
|
|
9
9
|
Classifier: License :: OSI Approved :: Apache Software License
|
|
10
10
|
Classifier: Operating System :: OS Independent
|
|
11
|
-
Requires-Python: >=3.
|
|
11
|
+
Requires-Python: >=3.11
|
|
12
12
|
Description-Content-Type: text/markdown
|
|
13
13
|
License-File: LICENSE
|
|
14
14
|
Requires-Dist: biopython>=1.85
|
|
@@ -20,10 +20,10 @@ Requires-Dist: click<9,>=8.1.8
|
|
|
20
20
|
Requires-Dist: pandera<0.24,>=0.23.1
|
|
21
21
|
Requires-Dist: pyfastx<3,>=2.2.0
|
|
22
22
|
Requires-Dist: intervaltree<4,>=3.1.0
|
|
23
|
-
Provides-Extra:
|
|
24
|
-
Requires-Dist: pytest<9,>=8.3.5; extra == "
|
|
25
|
-
Requires-Dist: pytest-md>=0.2.0; extra == "
|
|
26
|
-
Requires-Dist: pytest-workflow==2.1.0; extra == "
|
|
23
|
+
Provides-Extra: test
|
|
24
|
+
Requires-Dist: pytest<9,>=8.3.5; extra == "test"
|
|
25
|
+
Requires-Dist: pytest-md>=0.2.0; extra == "test"
|
|
26
|
+
Requires-Dist: pytest-workflow==2.1.0; extra == "test"
|
|
27
27
|
Provides-Extra: dev
|
|
28
28
|
Requires-Dist: pre-commit>=4.2.0; extra == "dev"
|
|
29
29
|
Requires-Dist: black>=25.1.0; extra == "dev"
|
|
@@ -22,7 +22,6 @@ import pandas as pd
|
|
|
22
22
|
|
|
23
23
|
|
|
24
24
|
def parse_args():
|
|
25
|
-
|
|
26
25
|
parser = argparse.ArgumentParser()
|
|
27
26
|
parser.add_argument(
|
|
28
27
|
"-i", "--input", required=True, type=str, help="Input JSON from antiSMASH"
|
|
@@ -64,7 +63,6 @@ def main():
|
|
|
64
63
|
region_name = None
|
|
65
64
|
|
|
66
65
|
for feature in record["features"]:
|
|
67
|
-
|
|
68
66
|
if feature["type"] == "region":
|
|
69
67
|
# Annotate region features
|
|
70
68
|
region_name = (
|
|
@@ -129,35 +127,34 @@ def main():
|
|
|
129
127
|
cds_by_protocluster = record["modules"][
|
|
130
128
|
"antismash.detection.hmm_detection"
|
|
131
129
|
]["rule_results"]["cds_by_protocluster"]
|
|
132
|
-
|
|
133
|
-
|
|
134
|
-
|
|
135
|
-
|
|
136
|
-
|
|
137
|
-
|
|
130
|
+
|
|
131
|
+
if not cds_by_protocluster:
|
|
132
|
+
continue
|
|
133
|
+
|
|
134
|
+
for feature in cds_by_protocluster[0][1]:
|
|
135
|
+
if locus_tag := feature.get("cds_name"):
|
|
136
|
+
as_clusters = ",".join(list(feature["definition_domains"].keys()))
|
|
137
|
+
if locus_tag in attributes_dict:
|
|
138
|
+
attributes_dict[locus_tag].update(
|
|
139
|
+
{"as_gene_clusters": as_clusters}
|
|
138
140
|
)
|
|
139
|
-
if locus_tag in attributes_dict.keys():
|
|
140
|
-
attributes_dict[locus_tag].update(
|
|
141
|
-
{"as_gene_clusters": as_clusters}
|
|
142
|
-
)
|
|
143
141
|
|
|
144
142
|
if "antismash.detection.genefunctions" in record["modules"].keys():
|
|
145
|
-
|
|
146
|
-
|
|
147
|
-
|
|
148
|
-
|
|
149
|
-
|
|
150
|
-
|
|
151
|
-
|
|
152
|
-
|
|
153
|
-
|
|
154
|
-
|
|
155
|
-
|
|
143
|
+
gene_function_tools = record["modules"][
|
|
144
|
+
"antismash.detection.genefunctions"
|
|
145
|
+
]["tools"]
|
|
146
|
+
if tool_data := gene_function_tools.get("smcogs"):
|
|
147
|
+
|
|
148
|
+
for locus_tag in tool_data["best_hits"]:
|
|
149
|
+
smcog_id = tool_data["best_hits"][locus_tag]["reference_id"]
|
|
150
|
+
smcog_description = tool_data["best_hits"][locus_tag]["description"]
|
|
151
|
+
|
|
152
|
+
score = tool_data["best_hits"][locus_tag]["bitscore"]
|
|
153
|
+
e_value = tool_data["best_hits"][locus_tag]["evalue"]
|
|
156
154
|
|
|
157
|
-
|
|
158
|
-
|
|
159
|
-
|
|
160
|
-
break
|
|
155
|
+
smcog_note = f"smCOG:{smcog_id}:{smcog_description.replace(' ', '_')}(Score:{score}%3BE-value:{e_value})"
|
|
156
|
+
if locus_tag in attributes_dict.keys():
|
|
157
|
+
attributes_dict[locus_tag].update({"as_notes": smcog_note})
|
|
161
158
|
|
|
162
159
|
attributes = [
|
|
163
160
|
";".join(f"{k}={v}" for k, v in attrib_data.items() if v)
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: mgnify_pipelines_toolkit
|
|
3
|
-
Version: 1.1.2
|
|
3
|
+
Version: 1.2.0
|
|
4
4
|
Summary: Collection of scripts and tools for MGnify pipelines
|
|
5
5
|
Author-email: MGnify team <metagenomics-help@ebi.ac.uk>
|
|
6
6
|
License: Apache Software License 2.0
|
|
@@ -8,7 +8,7 @@ Keywords: bioinformatics,pipelines,metagenomics
|
|
|
8
8
|
Classifier: Programming Language :: Python :: 3
|
|
9
9
|
Classifier: License :: OSI Approved :: Apache Software License
|
|
10
10
|
Classifier: Operating System :: OS Independent
|
|
11
|
-
Requires-Python: >=3.
|
|
11
|
+
Requires-Python: >=3.11
|
|
12
12
|
Description-Content-Type: text/markdown
|
|
13
13
|
License-File: LICENSE
|
|
14
14
|
Requires-Dist: biopython>=1.85
|
|
@@ -20,10 +20,10 @@ Requires-Dist: click<9,>=8.1.8
|
|
|
20
20
|
Requires-Dist: pandera<0.24,>=0.23.1
|
|
21
21
|
Requires-Dist: pyfastx<3,>=2.2.0
|
|
22
22
|
Requires-Dist: intervaltree<4,>=3.1.0
|
|
23
|
-
Provides-Extra:
|
|
24
|
-
Requires-Dist: pytest<9,>=8.3.5; extra == "
|
|
25
|
-
Requires-Dist: pytest-md>=0.2.0; extra == "
|
|
26
|
-
Requires-Dist: pytest-workflow==2.1.0; extra == "
|
|
23
|
+
Provides-Extra: test
|
|
24
|
+
Requires-Dist: pytest<9,>=8.3.5; extra == "test"
|
|
25
|
+
Requires-Dist: pytest-md>=0.2.0; extra == "test"
|
|
26
|
+
Requires-Dist: pytest-workflow==2.1.0; extra == "test"
|
|
27
27
|
Provides-Extra: dev
|
|
28
28
|
Requires-Dist: pre-commit>=4.2.0; extra == "dev"
|
|
29
29
|
Requires-Dist: black>=25.1.0; extra == "dev"
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
[project]
|
|
2
2
|
name = "mgnify_pipelines_toolkit"
|
|
3
|
-
version = "1.1.2"
|
|
3
|
+
version = "1.2.0"
|
|
4
4
|
readme = "README.md"
|
|
5
5
|
license = { text = "Apache Software License 2.0" }
|
|
6
6
|
authors = [
|
|
@@ -8,7 +8,7 @@ authors = [
|
|
|
8
8
|
]
|
|
9
9
|
keywords = ["bioinformatics", "pipelines", "metagenomics"]
|
|
10
10
|
description = "Collection of scripts and tools for MGnify pipelines"
|
|
11
|
-
requires-python = ">=3.
|
|
11
|
+
requires-python = ">=3.11"
|
|
12
12
|
classifiers = [
|
|
13
13
|
"Programming Language :: Python :: 3",
|
|
14
14
|
"License :: OSI Approved :: Apache Software License",
|
|
@@ -89,7 +89,7 @@ fasta_to_delimited = "mgnify_pipelines_toolkit.utils.fasta_to_delimited:main"
|
|
|
89
89
|
get_mpt_version = "mgnify_pipelines_toolkit.utils.get_mpt_version:main"
|
|
90
90
|
|
|
91
91
|
[project.optional-dependencies]
|
|
92
|
-
|
|
92
|
+
test = [
|
|
93
93
|
"pytest>=8.3.5,<9",
|
|
94
94
|
"pytest-md>=0.2.0",
|
|
95
95
|
"pytest-workflow==2.1.0",
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|