XspecT 0.1.3__py3-none-any.whl → 0.2.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release: this version of XspecT has been flagged by the registry; consult the registry's advisory page for details.
- {XspecT-0.1.3.dist-info → XspecT-0.2.0.dist-info}/METADATA +23 -29
- XspecT-0.2.0.dist-info/RECORD +30 -0
- {XspecT-0.1.3.dist-info → XspecT-0.2.0.dist-info}/WHEEL +1 -1
- xspect/definitions.py +42 -0
- xspect/download_filters.py +11 -26
- xspect/fastapi.py +101 -0
- xspect/file_io.py +34 -103
- xspect/main.py +70 -66
- xspect/model_management.py +88 -0
- xspect/models/__init__.py +0 -0
- xspect/models/probabilistic_filter_model.py +277 -0
- xspect/models/probabilistic_filter_svm_model.py +169 -0
- xspect/models/probabilistic_single_filter_model.py +109 -0
- xspect/models/result.py +148 -0
- xspect/pipeline.py +201 -0
- xspect/run.py +38 -0
- xspect/train.py +304 -0
- xspect/train_filter/create_svm.py +6 -183
- xspect/train_filter/extract_and_concatenate.py +117 -121
- xspect/train_filter/html_scrap.py +16 -28
- xspect/train_filter/ncbi_api/download_assemblies.py +7 -8
- xspect/train_filter/ncbi_api/ncbi_assembly_metadata.py +9 -17
- xspect/train_filter/ncbi_api/ncbi_children_tree.py +3 -2
- xspect/train_filter/ncbi_api/ncbi_taxon_metadata.py +7 -5
- XspecT-0.1.3.dist-info/RECORD +0 -49
- xspect/BF_v2.py +0 -637
- xspect/Bootstrap.py +0 -29
- xspect/Classifier.py +0 -142
- xspect/OXA_Table.py +0 -53
- xspect/WebApp.py +0 -724
- xspect/XspecT_mini.py +0 -1363
- xspect/XspecT_trainer.py +0 -611
- xspect/map_kmers.py +0 -155
- xspect/search_filter.py +0 -504
- xspect/static/How-To.png +0 -0
- xspect/static/Logo.png +0 -0
- xspect/static/Logo2.png +0 -0
- xspect/static/Workflow_AspecT.png +0 -0
- xspect/static/Workflow_ClAssT.png +0 -0
- xspect/static/js.js +0 -615
- xspect/static/main.css +0 -280
- xspect/templates/400.html +0 -64
- xspect/templates/401.html +0 -62
- xspect/templates/404.html +0 -62
- xspect/templates/500.html +0 -62
- xspect/templates/about.html +0 -544
- xspect/templates/home.html +0 -51
- xspect/templates/layoutabout.html +0 -87
- xspect/templates/layouthome.html +0 -63
- xspect/templates/layoutspecies.html +0 -468
- xspect/templates/species.html +0 -33
- xspect/train_filter/README_XspecT_Erweiterung.md +0 -119
- xspect/train_filter/get_paths.py +0 -35
- xspect/train_filter/interface_XspecT.py +0 -204
- xspect/train_filter/k_mer_count.py +0 -162
- {XspecT-0.1.3.dist-info → XspecT-0.2.0.dist-info}/LICENSE +0 -0
- {XspecT-0.1.3.dist-info → XspecT-0.2.0.dist-info}/entry_points.txt +0 -0
- {XspecT-0.1.3.dist-info → XspecT-0.2.0.dist-info}/top_level.txt +0 -0
xspect/Classifier.py
DELETED
|
@@ -1,142 +0,0 @@
|
|
|
1
|
-
from sklearn.svm import SVC
|
|
2
|
-
import csv
|
|
3
|
-
from copy import deepcopy
|
|
4
|
-
|
|
5
|
-
|
|
6
|
-
def cut_csv(csv_file, lst, table=False):
    """Return the selected slice of the training data in *csv_file*.

    The CSV is expected to have the layout ``File, <label cols...>, Label``:
    column 0 is a file name, the last column is the class label, and the
    columns in between are feature/label columns matching ``lst``.

    :param csv_file: path to the training-data CSV.
    :param lst: list of booleans, one per selectable column; index 8 is the
        "Added Genomes" toggle and is expanded to cover every extra column.
    :param table: when True, the returned matrix is decorated for display
        (file name prepended, label appended, header row inserted).
    :return: tuple ``(X_train, y_train)`` of feature rows and labels.
    """
    r = csv.reader(open(csv_file))
    m = list(r)
    # Copy so the caller's selection list is not mutated by `del` below.
    selected = deepcopy(lst)

    header = m[0]
    m = m[1:]
    labels = header[1:-1]

    X_train = []
    y_train = []
    files = []

    # Expand the single "Added Genomes" toggle (index 8) into one boolean
    # per extra genome column.
    # NOTE(review): the guard checks len(header[8:-1]) but the expansion uses
    # len(header[9:-1]) — presumably intentional (toggle column vs. data
    # columns), but confirm against the CSV layout.
    if selected[8] and len(header[8:-1]) > 0:
        # Added Genomes selected
        del selected[8]
        selected = selected + ([True] * len(header[9:-1]))

    else:
        # Added Genomes not selected
        del selected[8]
        selected = selected + ([False] * len(header[9:-1]))

    # creating matrix
    for i in range(len(m)):
        X_train.append(m[i][1:-1])
        y_train.append(m[i][-1])
        files.append(m[i][0])

    # Deleting Cols: drop every feature column whose toggle is False.
    # Iterates in reverse so the `del` does not shift pending indices.
    for i in range(len(X_train)):
        for j in range(len(X_train[i]) - 1, -1, -1):
            if selected[j]:
                pass
            else:
                del X_train[i][j]

    # Deleting Rows: keep only rows whose label belongs to a selected
    # column (or the literal "None" label, which is always valid).
    valid = ["None"]
    for i in range(len(selected)):
        if selected[i]:
            valid.append(labels[i])

    for i in range(len(X_train) - 1, -1, -1):
        if y_train[i] not in valid:
            del y_train[i]
            del X_train[i]
            del files[i]

    if table:
        # Inserting Infos for Table: decorate rows and header for display.
        for i in range(len(X_train)):
            X_train[i].insert(0, files[i])
            X_train[i].append(y_train[i])

        for i in range(len(header) - 1, -1, -1):
            if header[i] not in valid:
                del header[i]

        header.insert(0, "File")
        header.append("Label")

        X_train.insert(0, header)

    else:
        pass

    return X_train, y_train
def cut_csv_spec(csv_file):
    """Return the SVM training data stored in *csv_file*.

    The first CSV row is a header and is skipped; for every remaining row,
    column 0 (file name) and the last column (label) frame the feature
    values.

    :param csv_file: path to the training-data CSV.
    :return: tuple ``(X_train, y_train)`` where ``X_train`` is a list of
        feature-string rows and ``y_train`` the matching label strings.
    """
    # `with` closes the handle (the original leaked it); newline="" is the
    # documented way to open files for the csv module.
    with open(csv_file, newline="") as handle:
        rows = list(csv.reader(handle))

    # Build the classifier input matrix, skipping the header row.
    X_train = [row[1:-1] for row in rows[1:]]
    y_train = [row[-1] for row in rows[1:]]
    return X_train, y_train
|
95
|
-
def classify(csv_file, result, lst):
    """Classify a result vector with an SVM trained from *csv_file*.

    The second header cell decides the mode: ``"IC1"`` selects the ClAssT
    clone-type classifier (poly kernel), anything else the XspecT species
    classifier (RBF kernel).

    :param csv_file: path to the training-data CSV.
    :param result: score vector to classify (same column order as the
        training features).
    :param lst: column-selection booleans, forwarded to :func:`cut_csv`
        in ClAssT mode; ignored in XspecT mode.
    :return: the predicted label string, or a "no hit" label when every
        score is below the 0.3 confidence threshold.
    """
    # Only the header row is needed to pick the mode; `with` closes the
    # handle (the original read the whole file and leaked the handle).
    with open(csv_file, newline="") as handle:
        header = next(csv.reader(handle))

    # deciding which kernel-function will be used
    if header[1] == "IC1":
        mode = "ClAssT"
        X_train, y_train = cut_csv(csv_file, lst)
        svm = SVC(kernel="poly", C=1.0).fit(X_train, y_train)
    else:
        mode = "XspecT"
        X_train, y_train = cut_csv_spec(csv_file)
        svm = SVC(kernel="rbf", C=1.5).fit(X_train, y_train)

    # perform a prediction using the svm
    prediction = svm.predict([result])

    # Below the confidence threshold the SVM output is discarded and a
    # mode-specific "no hit" label is returned instead (the original
    # duplicated this check in both branches).
    if max(result) < 0.3:
        return "sp." if mode == "XspecT" else "None"

    return prediction[0]
120
|
-
def IC3_classify(result_2):
    """Classify a score against International Clonetype 3 references.

    A tiny one-feature SVM is trained on two real IC3 reference scores and
    two fictional "none" anchors, then applied to *result_2*.

    :param result_2: single-element score vector.
    :return: tuple ``(prediction_array, score)`` — the SVM prediction and
        the raw input score.
    """
    ic = "International Clonetype 3 (ST32 or ST250)"
    none_label = "NONE of the selected Clonetypes or Genomes"
    references = [
        ("GCF_000278625.1", 1.0, ic),
        ("GCF_001674185.1", 0.86, ic),
        ("fictional", 0.85, none_label),
        ("fictional", 0.01, none_label),
    ]

    # Each sample is a one-element feature vector: just the score.
    X = [[score] for _, score, _ in references]
    y = [label for _, _, label in references]

    svm_IC3 = SVC(kernel="poly", C=1).fit(X, y)

    return svm_IC3.predict([result_2]), result_2[0]
|
142
|
-
# https://scikit-learn.org/stable/modules/generated/sklearn.preprocessing.StandardScaler.html
|
xspect/OXA_Table.py
DELETED
|
@@ -1,53 +0,0 @@
|
|
|
1
|
-
import json
|
|
2
|
-
from Bio import SeqIO
|
|
3
|
-
import os
|
|
4
|
-
|
|
5
|
-
|
|
6
|
-
class OXATable:
    """Consumable k-mer count table for OXA gene sequences.

    ``kmere`` maps a gene name to a dict of 20-mers and their remaining
    occurrence counts; :meth:`lookup` consumes one occurrence per hit.
    """

    def __init__(self):
        # gene name -> {20-mer string: remaining occurrence count}
        self.kmere = {}
        self.total = 0
        self.found = 0

    def create_table(self, directory):
        """Build a 20-mer count table for every fasta file in *directory*.

        Each file contributes one entry keyed by its name minus a 6-char
        extension (e.g. ``.fasta``).

        :param directory: directory containing the fasta files.
        :return: dict mapping gene name to its k-mer count dict.
        """
        # taking all fasta files for one big table
        oxas = {}
        for filename in os.listdir(directory):
            kmere = {}
            # os.path.join works whether or not `directory` has a trailing
            # separator (the original string concatenation required one).
            path = os.path.join(directory, filename)
            for sequence in SeqIO.parse(path, "fasta"):
                seq = str(sequence.seq)
                # Slide a 20-wide window over the sequence.
                for j in range(len(seq) - 20 + 1):
                    kmer = seq[j : j + 20]
                    kmere[kmer] = kmere.get(kmer, 0) + 1
            # NOTE(review): assumes a 6-character extension — confirm the
            # input files are always ".fasta".
            oxas[filename[:-6]] = kmere
        # Bug fix: the original built `oxas` and silently discarded it
        # (no return, no assignment to self). Returning it is backward
        # compatible, since the old return value was always None.
        return oxas

    def lookup(self, gene, kmer):
        """Consume one occurrence of *kmer* for *gene*.

        :return: True only if the k-mer is known for *gene* and at least
            one occurrence remained; the counter is decremented on success.
        """
        count = self.kmere[gene].get(kmer, 0)
        if count > 0:
            self.kmere[gene][kmer] = count - 1
            return True
        return False

    def save_dic(self, path):
        """Serialise the k-mer table to *path* as JSON."""
        # `with` closes the handle (the original leaked it).
        with open(path, "w") as handle:
            json.dump(self.kmere, handle)

    def read_dic(self, path):
        """Load the k-mer table from the JSON file at *path*."""
        with open(path) as handle:
            self.kmere = json.load(handle)

    def cleanup(self):
        """Drop the k-mer table to free memory."""
        self.kmere = {}

    def get_counter(self, path=r"filter/OXAs_dict/counter.txt"):
        """Load and return the JSON counter table stored at *path*."""
        with open(path) as handle:
            return json.load(handle)