PyamilySeq 1.3.1__py3-none-any.whl → 1.3.3__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- PyamilySeq/{Cluster_Compare.py → Group_Compare.py} +27 -13
- PyamilySeq/Group_Extractor.py +29 -12
- PyamilySeq/Group_Sizes.py +22 -8
- PyamilySeq/Group_Splitter.py +89 -29
- PyamilySeq/{Cluster_Summary.py → Group_Summary.py} +18 -20
- PyamilySeq/PyamilySeq.py +66 -43
- PyamilySeq/PyamilySeq_Genus.py +1 -1
- PyamilySeq/PyamilySeq_Species.py +30 -63
- PyamilySeq/Seq_Combiner.py +125 -15
- PyamilySeq/Seq_Extractor.py +24 -2
- PyamilySeq/Seq_Finder.py +20 -2
- PyamilySeq/clusterings.py +1 -1
- PyamilySeq/constants.py +142 -1
- PyamilySeq/utils.py +171 -84
- {pyamilyseq-1.3.1.dist-info → pyamilyseq-1.3.3.dist-info}/METADATA +14 -14
- pyamilyseq-1.3.3.dist-info/RECORD +21 -0
- {pyamilyseq-1.3.1.dist-info → pyamilyseq-1.3.3.dist-info}/WHEEL +1 -1
- {pyamilyseq-1.3.1.dist-info → pyamilyseq-1.3.3.dist-info}/entry_points.txt +4 -4
- PyamilySeq/config.py +0 -0
- pyamilyseq-1.3.1.dist-info/RECORD +0 -22
- {pyamilyseq-1.3.1.dist-info → pyamilyseq-1.3.3.dist-info}/licenses/LICENSE +0 -0
- {pyamilyseq-1.3.1.dist-info → pyamilyseq-1.3.3.dist-info}/top_level.txt +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: PyamilySeq
|
|
3
|
-
Version: 1.3.
|
|
3
|
+
Version: 1.3.3
|
|
4
4
|
Summary: PyamilySeq - A a tool to investigate sequence-based gene groups identified by clustering methods such as CD-HIT, DIAMOND, BLAST or MMseqs2.
|
|
5
5
|
Author-email: Nicholas Dimonaco <nicholas@dimonaco.co.uk>
|
|
6
6
|
License: GNU GENERAL PUBLIC LICENSE
|
|
@@ -720,7 +720,7 @@ To update to the newest version add '-U' to end of the pip install command.
|
|
|
720
720
|
```commandline
|
|
721
721
|
usage: PyamilySeq.py [-h] {Full,Partial} ...
|
|
722
722
|
|
|
723
|
-
PyamilySeq v1.3.
|
|
723
|
+
PyamilySeq v1.3.3: A tool for gene clustering and analysis.
|
|
724
724
|
|
|
725
725
|
positional arguments:
|
|
726
726
|
{Full,Partial} Choose a mode: 'Full' or 'Partial'.
|
|
@@ -750,7 +750,7 @@ Escherichia_coli_110957|ENSB_TIZS9kbTvShDvyX Escherichia_coli_110957|ENSB_TIZS9k
|
|
|
750
750
|
```
|
|
751
751
|
### Example output:
|
|
752
752
|
```
|
|
753
|
-
Running PyamilySeq v1.3.
|
|
753
|
+
Running PyamilySeq v1.3.3
|
|
754
754
|
Calculating Groups
|
|
755
755
|
Number of Genomes: 10
|
|
756
756
|
Gene Groups
|
|
@@ -805,7 +805,7 @@ Total Number of First Gene Groups That Had Additional Second Sequences But Not N
|
|
|
805
805
|
## PyamilySeq is separated into two main 'run modes', Full and Partial. They each have their own set of required and optional arguments.
|
|
806
806
|
### PyamilySeq - Full Menu:
|
|
807
807
|
```
|
|
808
|
-
usage: PyamilySeq.py Full [-h] -output_dir OUTPUT_DIR -input_type {separate,combined,fasta} [-input_dir INPUT_DIR] [-input_fasta INPUT_FASTA] [-name_split_gff NAME_SPLIT_GFF] [-name_split_fasta NAME_SPLIT_FASTA] [-
|
|
808
|
+
usage: PyamilySeq.py Full [-h] -output_dir OUTPUT_DIR -input_type {separate,combined,fasta} [-input_dir INPUT_DIR] [-input_fasta INPUT_FASTA] [-name_split_gff NAME_SPLIT_GFF] [-name_split_fasta NAME_SPLIT_FASTA] [-seq_type {AA,DNA}] [-gene_ident GENE_IDENT] [-c PIDENT] [-s LEN_DIFF] [-fast_mode]
|
|
809
809
|
[-group_mode {Species,Genus}] [-species_groups SPECIES_GROUPS] [-genus_groups GENUS_GROUPS] [-write_groups WRITE_GROUPS] [-write_individual_groups] [-align] [-align_aa] [-no_gpa] [-M MEM] [-T THREADS] [-verbose] [-v]
|
|
810
810
|
|
|
811
811
|
options:
|
|
@@ -821,7 +821,7 @@ options:
|
|
|
821
821
|
Substring to split filenames and extract genome names for gff files (e.g., '_combined.gff3') - Use with -input_type separate/combined.
|
|
822
822
|
-name_split_fasta NAME_SPLIT_FASTA
|
|
823
823
|
Substring to split filenames and extract genome names for fasta files if named differently to paired gff files (e.g., '_dna.fasta') - Use with -input_type separate/combined.
|
|
824
|
-
-
|
|
824
|
+
-seq_type {AA,DNA}
|
|
825
825
|
Clustering mode: 'DNA' or 'AA'.
|
|
826
826
|
-gene_ident GENE_IDENT
|
|
827
827
|
Gene identifiers to extract sequences (e.g., 'CDS, tRNA').
|
|
@@ -895,7 +895,7 @@ Seq-Combiner -input_dir .../test_data/genomes -name_split_gff .gff3 -output_dir
|
|
|
895
895
|
```
|
|
896
896
|
usage: Seq_Combiner.py [-h] -input_dir INPUT_DIR -input_type {separate,combined,fasta} [-name_split_gff NAME_SPLIT_GFF] [-name_split_fasta NAME_SPLIT_FASTA] -output_dir OUTPUT_DIR -output_name OUTPUT_FILE [-gene_ident GENE_IDENT] [-translate] [-v]
|
|
897
897
|
|
|
898
|
-
PyamilySeq v1.3.
|
|
898
|
+
PyamilySeq v1.3.3: Seq-Combiner - A tool to extract sequences from GFF/FASTA files and prepare them for PyamilySeq.
|
|
899
899
|
|
|
900
900
|
options:
|
|
901
901
|
-h, --help show this help message and exit
|
|
@@ -927,18 +927,18 @@ Misc Arguments:
|
|
|
927
927
|
## Group-Splitter: This tool can split multi-copy gene groups using CD-HIT after initial PyamilySeq analysis.
|
|
928
928
|
### Example:
|
|
929
929
|
```bash
|
|
930
|
-
Group-Splitter -genome_num 10 -input_fasta .../test/species/ -output_dir .../test/species/ -
|
|
930
|
+
Group-Splitter -genome_num 10 -input_fasta .../test/species/ -output_dir .../test/species/ -seq_type AA
|
|
931
931
|
```
|
|
932
932
|
### Group-Splitter Menu:
|
|
933
933
|
```
|
|
934
|
-
usage: Group_Splitter.py [-h] -input_fasta INPUT_FASTA -
|
|
934
|
+
usage: Group_Splitter.py [-h] -input_fasta INPUT_FASTA -seq_type {AA,DNA}
|
|
935
935
|
-genome_num GENOME_NUM -output_dir OUTPUT_DIR
|
|
936
936
|
[-groups GROUPS] [-group_threshold GROUP_THRESHOLD]
|
|
937
937
|
[-c PIDENT] [-s LEN_DIFF] [-T CLUSTERING_THREADS]
|
|
938
938
|
[-M CLUSTERING_MEMORY] [-no_delete_temp_files]
|
|
939
939
|
[-verbose] [-v]
|
|
940
940
|
|
|
941
|
-
PyamilySeq v1.3.
|
|
941
|
+
PyamilySeq v1.3.3: Group-Splitter - A tool to split multi-copy gene groups
|
|
942
942
|
identified by PyamilySeq.
|
|
943
943
|
|
|
944
944
|
options:
|
|
@@ -947,7 +947,7 @@ options:
|
|
|
947
947
|
Required Parameters:
|
|
948
948
|
-input_fasta INPUT_FASTA
|
|
949
949
|
Input FASTA file containing gene groups.
|
|
950
|
-
-
|
|
950
|
+
-seq_type {AA,DNA}
|
|
951
951
|
Default - DNA: Are groups "DNA" or "AA" sequences?
|
|
952
952
|
-genome_num GENOME_NUM
|
|
953
953
|
The total number of genomes must be provide
|
|
@@ -981,17 +981,17 @@ Misc Parameters:
|
|
|
981
981
|
|
|
982
982
|
```
|
|
983
983
|
|
|
984
|
-
##
|
|
984
|
+
## Group-Summary menu: This tool can be used to summarise CD-HIT .clstr files:
|
|
985
985
|
### Example:
|
|
986
986
|
```bash
|
|
987
|
-
|
|
987
|
+
Group-Summary -genome_num 10 -input_clstr .../test_data/species/E-coli/E-coli_extracted_pep_cd-hit_80.clstr -output_tsv .../test_data/species/E-coli/E-coli_extracted_pep_cd-hit_80_Summary.tsv
|
|
988
988
|
```
|
|
989
|
-
###
|
|
989
|
+
### Group-Summary Menu:
|
|
990
990
|
```
|
|
991
991
|
usage: Cluster_Summary.py [-h] -input_clstr INPUT_CLSTR -output OUTPUT -genome_num GENOME_NUM
|
|
992
992
|
[-output_dir OUTPUT_DIR] [-verbose] [-v]
|
|
993
993
|
|
|
994
|
-
PyamilySeq v1.3.
|
|
994
|
+
PyamilySeq v1.3.3: Group-Summary - A tool to summarise CD-HIT clustering files.
|
|
995
995
|
|
|
996
996
|
options:
|
|
997
997
|
-h, --help show this help message and exit
|
|
@@ -0,0 +1,21 @@
|
|
|
1
|
+
PyamilySeq/Group_Compare.py,sha256=6GdJdrdMqsSG87xR1GZs2ddog1y9onlPaxq0Jt240oM,5460
|
|
2
|
+
PyamilySeq/Group_Extractor.py,sha256=FSeCY2z01GTSd--uWZpNEmddaLZizDNrjvcOnicuB_4,4153
|
|
3
|
+
PyamilySeq/Group_Sizes.py,sha256=VmJQ_DGJUO4fbrBGVq1eG6HypkjylVcwKvBB0w0CTTU,4075
|
|
4
|
+
PyamilySeq/Group_Splitter.py,sha256=iA2-_GA_9_wgALe307xKphQJRQ34sepYjS_lESamtxM,30069
|
|
5
|
+
PyamilySeq/Group_Summary.py,sha256=1CfzsmnVLLP1c8RGvfYprBFnMaAUqeUz6e-mEJ-P460,7529
|
|
6
|
+
PyamilySeq/PyamilySeq.py,sha256=Odt5Qpz9jX_8-CsIs4vQlU8DyxM_Xhhjx68mOg0M9wE,19231
|
|
7
|
+
PyamilySeq/PyamilySeq_Genus.py,sha256=5E3gDLp6lD8sSR8fepAVmxZJoP-dIeF0y9y7-gE24tM,12470
|
|
8
|
+
PyamilySeq/PyamilySeq_Species.py,sha256=vkeIViMFSwjBdQ2fF_J9yP3M3Y4jc3k3jHp5gnsqt6c,22327
|
|
9
|
+
PyamilySeq/Seq_Combiner.py,sha256=q6nU90oCdZdPaaPanPONvCiOg6RepUmZuPmFXld1aRs,10768
|
|
10
|
+
PyamilySeq/Seq_Extractor.py,sha256=PWVYHC6pyAdd_1evkbOgGsEoOvV3bPYLDoYpwYTQUAs,4497
|
|
11
|
+
PyamilySeq/Seq_Finder.py,sha256=IF4yuc3w2kpSZgaYDJJYODhIsEOND1IubsAxxdTTahk,3089
|
|
12
|
+
PyamilySeq/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
13
|
+
PyamilySeq/clusterings.py,sha256=73k3Ffu3lVG0NTU2lqiTFU4L7TF3tipNK5P-q4XpkAY,22374
|
|
14
|
+
PyamilySeq/constants.py,sha256=8DjqzKkB32OsgEjUrVbMzFMTlhJ8N8v0sZdoFMyCqyM,6470
|
|
15
|
+
PyamilySeq/utils.py,sha256=woFCv9l93drNGOQ_Ekg7wiHoU2eHq4_9WWErmm76Szs,37104
|
|
16
|
+
pyamilyseq-1.3.3.dist-info/licenses/LICENSE,sha256=OXLcl0T2SZ8Pmy2_dmlvKuetivmyPd5m1q-Gyd-zaYY,35149
|
|
17
|
+
pyamilyseq-1.3.3.dist-info/METADATA,sha256=yEVExWk6mTp8etYfJtsFiJyXAM7Oh4chk6Xhifz8MME,58533
|
|
18
|
+
pyamilyseq-1.3.3.dist-info/WHEEL,sha256=wUyA8OaulRlbfwMtmQsvNngGrxQHAvkKcvRmdizlJi0,92
|
|
19
|
+
pyamilyseq-1.3.3.dist-info/entry_points.txt,sha256=1P7oCXW1ONiy6LvGZ_Z6LPGDGcCIsZs7r0BIEtP_rmQ,830
|
|
20
|
+
pyamilyseq-1.3.3.dist-info/top_level.txt,sha256=J6JhugUQTq4rq96yibAlQu3o4KCM9WuYfqr3w1r119M,11
|
|
21
|
+
pyamilyseq-1.3.3.dist-info/RECORD,,
|
|
@@ -1,17 +1,17 @@
|
|
|
1
1
|
[console_scripts]
|
|
2
|
-
|
|
3
|
-
Cluster-Summary = PyamilySeq.Cluster_Summary:main
|
|
2
|
+
Group-Extractor = PyamilySeq.Group_Extractor:main
|
|
4
3
|
Group-Splitter = PyamilySeq.Group_Splitter:main
|
|
4
|
+
Group-Summary = PyamilySeq.Group_Summary:main
|
|
5
5
|
PyamilySeq = PyamilySeq.PyamilySeq:main
|
|
6
6
|
Seq-Combiner = PyamilySeq.Seq_Combiner:main
|
|
7
7
|
Seq-Extractor = PyamilySeq.Seq_Extractor:main
|
|
8
8
|
Seq-Finder = PyamilySeq.Seq_Finder:main
|
|
9
|
-
cluster-extractor = PyamilySeq.Cluster_Extractor:main
|
|
10
|
-
cluster-summary = PyamilySeq.Cluster_Summary:main
|
|
11
9
|
compare-contree-singletrees = aux_tools.RF.compare_contree_singletrees:main
|
|
12
10
|
compare-rf = aux_tools.RF.compare_RF:main
|
|
13
11
|
compute-singletrees-rf = aux_tools.RF.Compute_SingleTree_RFs:main
|
|
12
|
+
group-extractor = PyamilySeq.Group_Extractor:main
|
|
14
13
|
group-splitter = PyamilySeq.Group_Splitter:main
|
|
14
|
+
group-summary = PyamilySeq.Group_Summary:main
|
|
15
15
|
pyamilyseq = PyamilySeq.PyamilySeq:main
|
|
16
16
|
seq-combiner = PyamilySeq.Seq_Combiner:main
|
|
17
17
|
seq-extractor = PyamilySeq.Seq_Extractor:main
|
PyamilySeq/config.py
DELETED
|
File without changes
|
|
@@ -1,22 +0,0 @@
|
|
|
1
|
-
PyamilySeq/Cluster_Compare.py,sha256=2jRXBYN8T9TUDLV9bj3SWFQ2pBUH3BAKW1FYrDYSQBw,4421
|
|
2
|
-
PyamilySeq/Cluster_Summary.py,sha256=efXMfGvATERCTxwaqbauhZwt_5Hrf9KpGKY3EgsHVDk,6720
|
|
3
|
-
PyamilySeq/Group_Extractor.py,sha256=oe2VmOVxdvTmAcy8NKwD1F27IdN2utAfczxsyxg96yc,2898
|
|
4
|
-
PyamilySeq/Group_Sizes.py,sha256=3snkAN19o3Y4IY6IqSim1qy415FfQe1Wb8vzWTKF0Wo,3028
|
|
5
|
-
PyamilySeq/Group_Splitter.py,sha256=OcMj9GnAyybs_DaNKRyvfL_nl2dB2gUI4BD_EQrBbWo,25653
|
|
6
|
-
PyamilySeq/PyamilySeq.py,sha256=vc_mFuK-Cmqa3elusyIg5DksTHxdwCcFv2ki2ACqXIA,17468
|
|
7
|
-
PyamilySeq/PyamilySeq_Genus.py,sha256=KUC0QkCRpKQ9HEgxyTSD7Nc63wSXtriWyIqt_YOy5ys,12470
|
|
8
|
-
PyamilySeq/PyamilySeq_Species.py,sha256=1P_xbdUrZPykyS44KFyRdyxU-XPX_yKLpJhjhB8VTpg,24029
|
|
9
|
-
PyamilySeq/Seq_Combiner.py,sha256=G49zthWtsTfqYX1tqc7op9a9cSia1IL0VTiAtwgdTwc,4746
|
|
10
|
-
PyamilySeq/Seq_Extractor.py,sha256=IQk4Qn6LJkPXD1O4TQesneS3_ZN8hBsTVZQGlZ1c-Dk,3072
|
|
11
|
-
PyamilySeq/Seq_Finder.py,sha256=ht-fSQ_opWKydcoWI9D3nTwLt6Rpgevnf2y0KxVjw4M,1881
|
|
12
|
-
PyamilySeq/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
13
|
-
PyamilySeq/clusterings.py,sha256=bfST7_i6qnj9ogclmOSkQhurZaEWBBq0H48FAN7JpOg,22374
|
|
14
|
-
PyamilySeq/config.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
15
|
-
PyamilySeq/constants.py,sha256=rjAhz3KZ8STrueOdZOBvWKZUALDJM0y3QrTZGDE88JU,31
|
|
16
|
-
PyamilySeq/utils.py,sha256=1U794Xd5qzmaIz2VujdnPkND729kr7rKjei0Y57f-QE,32972
|
|
17
|
-
pyamilyseq-1.3.1.dist-info/licenses/LICENSE,sha256=OXLcl0T2SZ8Pmy2_dmlvKuetivmyPd5m1q-Gyd-zaYY,35149
|
|
18
|
-
pyamilyseq-1.3.1.dist-info/METADATA,sha256=-6Y4VzMdNpsQ7O4WB_xJ6Mxa9y0qovhrbYOwwPeahjQ,58566
|
|
19
|
-
pyamilyseq-1.3.1.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
|
20
|
-
pyamilyseq-1.3.1.dist-info/entry_points.txt,sha256=5RkUWIneXu-kCnClJhv0u27lWHAoyoVmospZMU5Cs2U,846
|
|
21
|
-
pyamilyseq-1.3.1.dist-info/top_level.txt,sha256=J6JhugUQTq4rq96yibAlQu3o4KCM9WuYfqr3w1r119M,11
|
|
22
|
-
pyamilyseq-1.3.1.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|