mgnify-pipelines-toolkit 0.1.3__tar.gz → 0.1.4__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of mgnify-pipelines-toolkit might be problematic. Click here for more details.

Files changed (33)
  1. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/PKG-INFO +1 -1
  2. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit/analysis/amplicon/make_asv_count_table.py +24 -14
  3. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit.egg-info/PKG-INFO +1 -1
  4. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/pyproject.toml +1 -1
  5. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/LICENSE +0 -0
  6. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/README.md +0 -0
  7. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit/__init__.py +0 -0
  8. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit/analysis/__init__.py +0 -0
  9. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit/analysis/amplicon/amplicon_utils.py +0 -0
  10. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit/analysis/amplicon/are_there_primers.py +0 -0
  11. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit/analysis/amplicon/assess_inflection_point_mcp.py +0 -0
  12. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit/analysis/amplicon/assess_mcp_proportions.py +0 -0
  13. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit/analysis/amplicon/classify_var_regions.py +0 -0
  14. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit/analysis/amplicon/find_mcp_inflection_points.py +0 -0
  15. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit/analysis/amplicon/mapseq_to_asv_table.py +0 -0
  16. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit/analysis/amplicon/primer_val_classification.py +0 -0
  17. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit/analysis/amplicon/remove_ambiguous_reads.py +0 -0
  18. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit/analysis/amplicon/rev_comp_se_primers.py +0 -0
  19. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit/analysis/amplicon/standard_primer_matching.py +0 -0
  20. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit/analysis/shared/__init__.py +0 -0
  21. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit/analysis/shared/get_subunits.py +0 -0
  22. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit/analysis/shared/get_subunits_coords.py +0 -0
  23. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit/analysis/shared/mapseq2biom.py +0 -0
  24. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit/constants/regex_ambiguous_bases.py +0 -0
  25. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit/constants/tax_ranks.py +0 -0
  26. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit/constants/thresholds.py +0 -0
  27. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit/constants/var_region_coordinates.py +0 -0
  28. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit.egg-info/SOURCES.txt +0 -0
  29. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit.egg-info/dependency_links.txt +0 -0
  30. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit.egg-info/entry_points.txt +0 -0
  31. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit.egg-info/requires.txt +0 -0
  32. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/mgnify_pipelines_toolkit.egg-info/top_level.txt +0 -0
  33. {mgnify_pipelines_toolkit-0.1.3 → mgnify_pipelines_toolkit-0.1.4}/setup.cfg +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: mgnify_pipelines_toolkit
3
- Version: 0.1.3
3
+ Version: 0.1.4
4
4
  Summary: Collection of scripts and tools for MGnify pipelines
5
5
  Author-email: MGnify team <metagenomics-help@ebi.ac.uk>
6
6
  License: Apache Software License 2.0
@@ -223,6 +223,25 @@ def make_tax_assignment_dict_pr2(taxa_df, asv_dict):
223
223
 
224
224
  return tax_assignment_dict
225
225
 
226
+ def generate_asv_count_dict(asv_dict):
227
+
228
+ res_dict = defaultdict(list)
229
+
230
+ for asv_id, count in asv_dict.items():
231
+
232
+ if count == 0:
233
+ continue
234
+
235
+ res_dict['asv'].append(asv_id)
236
+ res_dict['count'].append(count)
237
+
238
+ res_df = pd.DataFrame.from_dict(res_dict)
239
+ res_df = res_df.sort_values(by='asv', ascending=True)
240
+ res_df = res_df.sort_values(by='count', ascending=False)
241
+
242
+ return res_df
243
+
244
+
226
245
  def main():
227
246
  _TAXA, _FWD, _REV, _AMP, _HEADERS, _SAMPLE = parse_args()
228
247
 
@@ -250,23 +269,12 @@ def main():
250
269
  for line_fwd in fwd_fr:
251
270
  counter += 1
252
271
  line_fwd = line_fwd.strip()
253
- fwd_asvs = line_fwd.split(",")
254
272
 
255
- if paired_end:
256
- line_rev = next(rev_fr).strip()
257
- rev_asvs = line_rev.split(",")
258
- asv_intersection = list(set(fwd_asvs).intersection(rev_asvs))
259
-
260
- if len(asv_intersection) == 0:
261
- continue
262
-
263
- if len(asv_intersection) == 1 and asv_intersection[0] == "0":
264
- continue
265
- else:
266
- asv_intersection = fwd_asvs
273
+ if line_fwd == '0':
274
+ continue
267
275
 
268
276
  if headers[counter] in amp_reads:
269
- asv_dict[f"seq_{int(asv_intersection[0]) - 1}"] += 1
277
+ asv_dict[f"seq_{line_fwd}"] += 1
270
278
 
271
279
  fwd_fr.close()
272
280
  if paired_end:
@@ -285,6 +293,8 @@ def main():
285
293
  for tax_assignment, count in tax_assignment_dict.items():
286
294
  fw.write(f"{count}\t{tax_assignment}\n")
287
295
 
296
+ asv_count_df = generate_asv_count_dict(asv_dict)
297
+ asv_count_df.to_csv(f'./{_SAMPLE}_{amp_region}_asv_read_counts.tsv', sep='\t', index=False)
288
298
 
289
299
  if __name__ == "__main__":
290
300
  main()
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: mgnify_pipelines_toolkit
3
- Version: 0.1.3
3
+ Version: 0.1.4
4
4
  Summary: Collection of scripts and tools for MGnify pipelines
5
5
  Author-email: MGnify team <metagenomics-help@ebi.ac.uk>
6
6
  License: Apache Software License 2.0
@@ -1,6 +1,6 @@
1
1
  [project]
2
2
  name = "mgnify_pipelines_toolkit"
3
- version = "0.1.3"
3
+ version = "0.1.4"
4
4
  readme = "README.md"
5
5
  license = {text = "Apache Software License 2.0"}
6
6
  authors = [