mgnify-pipelines-toolkit 0.1.6__tar.gz → 0.1.8__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of mgnify-pipelines-toolkit might be problematic. Click here for more details.

Files changed (39) hide show
  1. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/PKG-INFO +1 -1
  2. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/analysis/amplicon/make_asv_count_table.py +3 -1
  3. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/analysis/amplicon/primer_val_classification.py +6 -4
  4. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/analysis/shared/get_subunits.py +1 -1
  5. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit.egg-info/PKG-INFO +1 -1
  6. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/pyproject.toml +1 -1
  7. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/LICENSE +0 -0
  8. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/README.md +0 -0
  9. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/__init__.py +0 -0
  10. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/analysis/__init__.py +0 -0
  11. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/analysis/amplicon/amplicon_utils.py +0 -0
  12. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/analysis/amplicon/are_there_primers.py +0 -0
  13. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/analysis/amplicon/assess_inflection_point_mcp.py +0 -0
  14. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/analysis/amplicon/assess_mcp_proportions.py +0 -0
  15. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/analysis/amplicon/classify_var_regions.py +0 -0
  16. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/analysis/amplicon/find_mcp_inflection_points.py +0 -0
  17. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/analysis/amplicon/mapseq_to_asv_table.py +0 -0
  18. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/analysis/amplicon/remove_ambiguous_reads.py +0 -0
  19. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/analysis/amplicon/rev_comp_se_primers.py +0 -0
  20. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/analysis/amplicon/standard_primer_matching.py +0 -0
  21. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/analysis/shared/__init__.py +0 -0
  22. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/analysis/shared/fastq_suffix_header_check.py +0 -0
  23. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/analysis/shared/get_subunits_coords.py +0 -0
  24. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/analysis/shared/library_strategy_check.py +0 -0
  25. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/analysis/shared/mapseq2biom.py +0 -0
  26. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/constants/regex_ambiguous_bases.py +0 -0
  27. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/constants/regex_fasta_header.py +0 -0
  28. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/constants/tax_ranks.py +0 -0
  29. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/constants/thresholds.py +0 -0
  30. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/constants/var_region_coordinates.py +0 -0
  31. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/utils/__init__.py +0 -0
  32. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/utils/fasta_to_delimited.py +0 -0
  33. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit/utils/get_mpt_version.py +0 -0
  34. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit.egg-info/SOURCES.txt +0 -0
  35. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit.egg-info/dependency_links.txt +0 -0
  36. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit.egg-info/entry_points.txt +0 -0
  37. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit.egg-info/requires.txt +0 -0
  38. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/mgnify_pipelines_toolkit.egg-info/top_level.txt +0 -0
  39. {mgnify_pipelines_toolkit-0.1.6 → mgnify_pipelines_toolkit-0.1.8}/setup.cfg +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: mgnify_pipelines_toolkit
3
- Version: 0.1.6
3
+ Version: 0.1.8
4
4
  Summary: Collection of scripts and tools for MGnify pipelines
5
5
  Author-email: MGnify team <metagenomics-help@ebi.ac.uk>
6
6
  License: Apache Software License 2.0
@@ -277,6 +277,8 @@ def main():
277
277
  taxa_df = taxa_df.fillna("0")
278
278
  taxa_df = order_df(taxa_df)
279
279
 
280
+ asv_list = taxa_df.ASV.to_list()
281
+
280
282
  amp_reads = [read.strip() for read in list(open(amp, "r"))]
281
283
  headers = [read.split(" ")[0][1:] for read in list(open(headers, "r"))]
282
284
  amp_region = ".".join(amp.split(".")[1:3])
@@ -288,7 +290,7 @@ def main():
288
290
  counter += 1
289
291
  line_fwd = line_fwd.strip()
290
292
 
291
- if line_fwd == "0":
293
+ if line_fwd == "0" or f"seq_{line_fwd}" not in asv_list:
292
294
  continue
293
295
 
294
296
  if headers[counter] in amp_reads:
@@ -58,19 +58,20 @@ def parse_args():
58
58
  return input, fasta, sample
59
59
 
60
60
 
61
- def get_amp_region(beg, strand, model):
61
+ def get_amp_region(beg, end, strand, model):
62
62
  prev_region = ""
63
63
 
64
64
  for region, region_coords in model.items():
65
65
 
66
66
  region_beg = region_coords[0]
67
67
  beg_diff = region_beg - beg
68
+ end_diff = region_beg - end
68
69
 
69
70
  if strand == STRAND_FWD:
70
- if beg_diff > 0:
71
+ if beg_diff > 0 and end_diff > 0:
71
72
  return region
72
73
  else:
73
- if beg_diff > 0:
74
+ if beg_diff > 0 and end_diff > 0:
74
75
  return prev_region
75
76
 
76
77
  prev_region = region
@@ -92,6 +93,7 @@ def main():
92
93
  primer_name = line_lst[0]
93
94
  rfam = line_lst[3]
94
95
  beg = float(line_lst[5])
96
+ end = float(line_lst[6])
95
97
 
96
98
  if rfam == "RF00177":
97
99
  gene = "16S"
@@ -116,7 +118,7 @@ def main():
116
118
  elif "R" in primer_name:
117
119
  strand = STRAND_REV
118
120
 
119
- amp_region = get_amp_region(beg, strand, model)
121
+ amp_region = get_amp_region(beg, end, strand, model)
120
122
  primer_seq = str(fasta_dict[primer_name].seq)
121
123
 
122
124
  res_dict["Gene"].append(gene)
@@ -102,7 +102,7 @@ def main():
102
102
  ]
103
103
  open_files = {}
104
104
  for record in SeqIO.parse(args.input, "fasta"):
105
- model = "-".join(record.id.split("/")[0].split("-")[1:])
105
+ model = "-".join(record.id.split("/")[0].split("-")[-1:])
106
106
  if model in coding_rna:
107
107
  filename = pattern_dict[model]
108
108
  else:
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: mgnify_pipelines_toolkit
3
- Version: 0.1.6
3
+ Version: 0.1.8
4
4
  Summary: Collection of scripts and tools for MGnify pipelines
5
5
  Author-email: MGnify team <metagenomics-help@ebi.ac.uk>
6
6
  License: Apache Software License 2.0
@@ -1,6 +1,6 @@
1
1
  [project]
2
2
  name = "mgnify_pipelines_toolkit"
3
- version = "0.1.6"
3
+ version = "0.1.8"
4
4
  readme = "README.md"
5
5
  license = {text = "Apache Software License 2.0"}
6
6
  authors = [