PyPI - ORForise - Versions diffs - 1.6.2__py3-none-any.whl → 1.6.4__py3-none-any.whl - Mend

ORForise: 1.6.2 (py3-none-any.whl) → 1.6.4 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (16)

ORForise/Aggregate_Compare.py +7 -4
ORForise/Annotation_Compare.py +7 -4
ORForise/Annotation_Intersector.py +89 -76
ORForise/Convert_To_GFF.py +7 -3
ORForise/GFF_Adder.py +7 -4
ORForise/List_Tools.py +7 -4
ORForise/StORForise.py +7 -2
ORForise/Tools/GFF/GFF.py +2 -2
ORForise/Tools/StORF-Reporter/StORF-Reporter.py +2 -2
ORForise/utils.py +2 -2
{orforise-1.6.2.dist-info → orforise-1.6.4.dist-info}/METADATA +7 -7
{orforise-1.6.2.dist-info → orforise-1.6.4.dist-info}/RECORD +16 -16
{orforise-1.6.2.dist-info → orforise-1.6.4.dist-info}/WHEEL +1 -1
{orforise-1.6.2.dist-info → orforise-1.6.4.dist-info}/entry_points.txt +0 -0
{orforise-1.6.2.dist-info → orforise-1.6.4.dist-info}/licenses/LICENSE +0 -0
{orforise-1.6.2.dist-info → orforise-1.6.4.dist-info}/top_level.txt +0 -0

ORForise/Aggregate_Compare.py CHANGED Viewed

@@ -337,7 +337,6 @@ def comparator(options):
 def main():
-    print(WELCOME)
     parser = argparse.ArgumentParser(description='ORForise ' + ORForise_Version + ': Aggregate-Compare Run Parameters.')
     parser._action_groups.pop()
@@ -373,6 +372,10 @@ def main():
     comparator(options)
 if __name__ == "__main__":
-    main()
-    print("Complete")
+    try:
+        try:
+            main()
+        except Exception:
+            print('Unhandled exception in main')
+    finally:
+        print(CLOSING)

ORForise/Annotation_Compare.py CHANGED Viewed

@@ -259,8 +259,6 @@ def comparator(options):
 def main():
-    print(WELCOME)
     parser = argparse.ArgumentParser(description='ORForise ' + ORForise_Version + ': Annotatione-Compare Run Parameters.')
     parser._action_groups.pop()
@@ -313,5 +311,10 @@ def main():
     comparator(options)
 if __name__ == "__main__":
-    main()
-    print("Complete")
+    try:
+        try:
+            main()
+        except Exception:
+            logging.exception('Unhandled exception in main')
+    finally:
+        print(CLOSING)

ORForise/Annotation_Intersector.py CHANGED Viewed

@@ -26,13 +26,12 @@ def gff_writer(genome_ID, genome_DNA, reference_annotation, reference_tool, ref_
     if out_dir:
         os.makedirs(out_dir, exist_ok=True)
-    # Always open the file and write the header first. Use a broad try so we can log any issue.
     try:
         with open(output_file, 'w', encoding='utf-8') as write_out:
             write_out.write("##gff-version\t3\n#\tAnnotation-Intersector\n#\tRun Date:" + str(date.today()) + '\n')
             if genome_DNA:
                 write_out.write("##Genome DNA File:" + genome_DNA + '\n')
-            write_out.write("##Original File: " + reference_annotation + "\n##Intersecting File: " + additional_annotation + '\n')
+            write_out.write("##Original File: " + (reference_annotation or '') + "\n##Intersecting File: " + (additional_annotation or '') + '\n')
             entries_written = 0
@@ -43,7 +42,7 @@ def gff_writer(genome_ID, genome_DNA, reference_annotation, reference_tool, ref_
                 # Parse reference annotation and write features matching gene_ident
                 try:
-                    if reference_annotation.endswith('.gz'):
+                    if reference_annotation and reference_annotation.endswith('.gz'):
                         rf = gzip.open(reference_annotation, 'rt')
                     else:
                         rf = open(reference_annotation, 'r', encoding='unicode_escape')
@@ -68,10 +67,11 @@ def gff_writer(genome_ID, genome_DNA, reference_annotation, reference_tool, ref_
                                 stop = parts[4]
                                 strand = parts[6]
                                 info = parts[8]
+                                source = parts[1] if len(parts) > 1 else ''
                             except Exception:
                                 continue
-                            # write entry with coverage 0 and empty additional annotation
-                            entry = f"{seqid}\t{os.path.splitext(os.path.basename(reference_annotation))[0]}\t{ftype}\t{start}\t{stop}\t.\t{strand}\t.\tID=Original_Annotation={info};Additional_Annotation=;Coverage=0\n"
+                            # write entry with coverage 0 and empty additional annotation; use source from input GFF
+                            entry = f"{seqid}\t{source}\t{ftype}\t{start}\t{stop}\t.\t{strand}\t.\tID=Original_Annotation={info}\n"
                             write_out.write(entry)
                             entries_written += 1
                 except Exception as e:
@@ -81,25 +81,26 @@ def gff_writer(genome_ID, genome_DNA, reference_annotation, reference_tool, ref_
                 logging.info('Wrote %d fallback reference entries to %s', entries_written, output_file)
                 return
+            # Iterate contigs and write kept entries. Kept entry layout expected:
+            # [strand, coverage, additional_type, ref_type, additional_info, ref_info, ref_source]
             for contig, genes in genes_To_Keep_by_contig.items():
-                # Use basename without extension for the source field
-                ref = os.path.splitext(os.path.basename(reference_annotation))[0].split('_')[0]
+                fallback_source = os.path.splitext(os.path.basename(reference_annotation))[0].split('_')[0] if reference_annotation else 'reference'
                 for pos, data in genes.items():
                     try:
                         pos_ = pos.split(',')
                         start = pos_[0]
                         stop = pos_[-1]
-                        strand = data[0]
-                        # Ensure indices exist and are strings
+                        strand = data[0] if len(data) > 0 else '.'
                         add_ann = str(data[4]) if len(data) > 4 else ''
                         orig_ann = str(data[5]) if len(data) > 5 else ''
+                        source_field = data[6] if len(data) > 6 and data[6] else fallback_source
+                        feat_type = data[3] if len(data) > 3 and data[3] else (data[2] if len(data) > 2 else 'CDS')
                         entry = (
-                            contig + '\t' + ref + '\t' + data[2] + '\t' + start + '\t' + stop + '\t.\t' + strand + '\t.\tID=Original_Annotation=' + orig_ann + ';Additional_Annotation=' + add_ann + ';Coverage=' + str(
+                            contig + '\t' + source_field + '\t' + feat_type + '\t' + start + '\t' + stop + '\t.\t' + strand + '\t.\tID=Original_Annotation=' + orig_ann + ';Additional_Annotation=' + add_ann + ';Coverage=' + str(
                                 data[1]) + '\n')
                         write_out.write(entry)
                         entries_written += 1
                     except Exception as e:
-                        # Log the bad entry and continue
                         logging.warning('Skipping bad GFF entry for contig %s pos %s: %s', contig, pos, e)
                         continue
@@ -179,7 +180,9 @@ def _write_discordance_report(report_path, entries):
 def _write_discordance_gff(report_path, entries, reference_annotation_basename):
-    """Write a list of discordance entries (dicts) to a GFF file."""
+    """Write a list of discordance entries (dicts) to a GFF file.
+    The GFF source column is taken from carried 'ref_source' or 'add_source' when available.
+    """
     report_path = os.path.expanduser(report_path)
     out_dir = os.path.dirname(report_path)
     if out_dir:
@@ -189,40 +192,35 @@ def _write_discordance_gff(report_path, entries, reference_annotation_basename):
             fh.write('##gff-version\t3\n')
             fh.write('#\tAnnotation-Intersector discordance report\n')
             fh.write('#\tRun Date:' + str(date.today()) + '\n')
-            fh.write('##Original File: ' + reference_annotation_basename + '\n')
+            fh.write('##Original File: ' + (reference_annotation_basename or '') + '\n')
             entries_written = 0
-            for e in entries:
+            for e in (entries or []):
                 try:
                     contig = str(e.get('contig', '.'))
-                    # prefer reference coords if present
                     ref_pos = e.get('ref_pos', '')
                     add_pos = e.get('add_pos', '')
                     if ref_pos:
                         start, stop = ref_pos.split(',')
                         ftype = e.get('ref_type', '') or 'CDS'
-                        source = reference_annotation_basename.split('_')[0] or 'reference'
+                        source = e.get('ref_source') or (reference_annotation_basename.split('_')[0] if reference_annotation_basename else 'reference')
                         info_attr = e.get('ref_info', '')
                     else:
-                        # No ref pos, use add_pos coords
-                        start, stop = add_pos.split(',') if add_pos else ('0','0')
+                        start, stop = add_pos.split(',') if add_pos else ('0', '0')
                         ftype = e.get('add_type', '') or 'CDS'
-                        source = e.get('add_type', '') or 'additional'
+                        source = e.get('add_source') or 'additional'
                         info_attr = e.get('add_info', '')
-                    # attributes
                     attrs = []
                     attrs.append('Status=' + str(e.get('status', '')))
                     attrs.append('Coverage=' + str(e.get('coverage', '')))
                     if e.get('ref_info', ''):
-                        attrs.append('Ref_info=' + str(e.get('ref_info', '')).replace(';','%3B'))
+                        attrs.append('Ref_info=' + str(e.get('ref_info', '')).replace(';', '%3B'))
                     if e.get('add_info', ''):
-                        attrs.append('Add_info=' + str(e.get('add_info', '')).replace(';','%3B'))
+                        attrs.append('Add_info=' + str(e.get('add_info', '')).replace(';', '%3B'))
                     attr_str = ';'.join(attrs)
-                    # construct GFF line
                     line = f"{contig}\t{source}\t{ftype}\t{start}\t{stop}\t.\t.\t.\t{attr_str}\n"
                     fh.write(line)
                     entries_written += 1
                 except Exception:
-                    # skip bad entry
                     continue
         logging.info('Wrote %d discordance GFF entries to %s', entries_written, report_path)
     except OSError as e:
@@ -236,12 +234,9 @@ def compute_discordance(ref_map_by_contig, add_map_by_contig, options):
     - only_in_additional: additional ORFs that don't overlap any reference entry
     - mismatches: reference entries with overlapping additional ORFs that don't meet match criteria
-    This version is strand-aware and will classify mismatches that are due to strand
-    differences separately from type/coverage differences.
     Expected layouts:
-    - ref entry: [strand, 'ref', type, info]
-    - add entry: [strand, ..., type (index 3), info (last element)]
+    - ref entry: [strand, 'ref', type, info, source]
+    - add entry: [strand, ..., type (index 3), info (last element), (optional) source]
     """
     only_in_ref = []
     only_in_additional = []
@@ -255,7 +250,6 @@ def compute_discordance(ref_map_by_contig, add_map_by_contig, options):
         ref_map = ref_map_by_contig.get(contig, {}) or {}
         add_map = add_map_by_contig.get(contig, {}) or {}
-        # For each reference feature, find best overlapping additional ORF and classify
         for rpos, rdata in ref_map.items():
             rstart, rstop = _parse_pos(rpos)
             if rstart is None:
@@ -266,10 +260,10 @@ def compute_discordance(ref_map_by_contig, add_map_by_contig, options):
             best_add_data = None
             matched = False
-            # reference fields
             r_strand = rdata[0] if len(rdata) > 0 else ''
-            r_type = rdata[3] if len(rdata) > 2 else ''
-            r_info = rdata[-1] if len(rdata) > 3 else ''
+            r_type = rdata[2] if len(rdata) > 2 else ''
+            r_info = rdata[3] if len(rdata) > 3 else ''
+            r_source = rdata[4] if len(rdata) > 4 else ''
             for apos, adata in add_map.items():
                 astart, astop = _parse_pos(apos)
@@ -284,27 +278,25 @@ def compute_discordance(ref_map_by_contig, add_map_by_contig, options):
                     best_add = apos
                     best_add_data = adata
-                # additional fields
                 a_strand = adata[0] if len(adata) > 0 else ''
                 a_type = adata[3] if len(adata) > 3 else ''
-                # frame check (distance of stops mod 3)
+                a_info = adata[-1] if len(adata) > 0 else ''
+                a_source = adata[4] if len(adata) > 4 else ''
                 try:
                     frame_ok = ((abs(astop - rstop) % 3) == 0)
                 except Exception:
                     frame_ok = True
-                # check for a fully satisfactory match: type, coverage, strand and frame
                 if a_type == r_type and cov >= cov_thresh and (a_strand == r_strand) and frame_ok:
                     matched = True
                     matched_adds.add((contig, apos))
                     break
             if matched:
-                # good match -> not discordant
                 continue
             if best_add is None:
-                # no overlapping additional ORF found
                 only_in_ref.append({
                     'contig': contig,
                     'ref_pos': rpos,
@@ -314,26 +306,24 @@ def compute_discordance(ref_map_by_contig, add_map_by_contig, options):
                     'status': 'only_in_ref',
                     'coverage': '0.00',
                     'ref_info': r_info,
+                    'ref_source': r_source,
                     'add_info': ''
                 })
             else:
-                # overlapping additional ORF(s) exist but none satisfied the match criteria
                 a_type = best_add_data[3] if len(best_add_data) > 3 else ''
                 a_info = best_add_data[-1] if len(best_add_data) > 0 else ''
                 a_strand = best_add_data[0] if len(best_add_data) > 0 else ''
+                a_source = best_add_data[4] if len(best_add_data) > 4 else ''
-                # compute reason flags
                 type_match = (a_type == r_type)
                 strand_match = (a_strand == r_strand)
                 cov_ok = (best_cov >= cov_thresh)
                 try:
-                    # use frame between best add and ref
                     astart, astop = _parse_pos(best_add)
                     frame_ok = ((abs(astop - rstop) % 3) == 0) if (astop is not None) else True
                 except Exception:
                     frame_ok = True
-                # classify mismatch with strand-awareness
                 if not cov_ok:
                     status = 'found_in_additional_but_below_coverage'
                 elif not type_match and not strand_match:
@@ -356,13 +346,14 @@ def compute_discordance(ref_map_by_contig, add_map_by_contig, options):
                     'status': status,
                     'coverage': f"{best_cov:.2f}",
                     'ref_info': r_info,
+                    'ref_source': r_source,
                     'add_info': a_info,
+                    'add_source': a_source,
                 })
                 if best_add:
                     matched_adds.add((contig, best_add))
-        # Additional-only ORFs: those not matched and not overlapping any reference
         for apos, adata in add_map.items():
             if (contig, apos) in matched_adds:
                 continue
@@ -378,6 +369,7 @@ def compute_discordance(ref_map_by_contig, add_map_by_contig, options):
                     overlapped = True
                     break
             if not overlapped:
+                add_source = adata[4] if len(adata) > 4 else ''
                 only_in_additional.append({
                     'contig': contig,
                     'ref_pos': '',
@@ -388,9 +380,11 @@ def compute_discordance(ref_map_by_contig, add_map_by_contig, options):
                     'coverage': '0.00',
                     'ref_info': '',
                     'add_info': adata[-1] if len(adata) > 0 else '',
+                    'add_source': add_source,
                 })
-    return only_in_ref, only_in_additional, mismatches
+    # Return discordance lists and the set of matched additional ORFs (for overlap counts)
+    return only_in_ref, only_in_additional, mismatches, matched_adds
 def comparator(options):
@@ -491,11 +485,14 @@ def comparator(options):
                     strand = parts[6]
                     pos = f"{start},{stop}"
                     info = parts[8]
+                    source = parts[1] if len(parts) > 1 else ''
                 except (IndexError, ValueError):
                     continue
                 if seqid not in ref_genes_by_contig:
                     ref_genes_by_contig[seqid] = OrderedDict()
-                ref_genes_by_contig[seqid].update({pos: [strand, 'ref', ftype, info]})
+                # Store source from column 1 as well. Layout becomes:
+                # [strand, 'ref', type, info, source]
+                ref_genes_by_contig[seqid].update({pos: [strand, 'ref', ftype, info, source]})
     else:
         # Use a tool parser to produce ref_genes; expect tool to return mapping contig->dict
         try:
@@ -558,12 +555,14 @@ def comparator(options):
                 ref_entry = ref_genes.get(f"{o_Start},{o_Stop}")
                 if not ref_entry:
                     continue
-                # ref_entry layout: [strand, 'ref', type, info]
-                ref_type = ref_entry[3] if len(ref_entry) > 2 else ''
-                ref_info = ref_entry[-1] if len(ref_entry) > 3 else ''
+                # ref_entry layout now: [strand, 'ref', type, info, source]
+                ref_type = ref_entry[2] if len(ref_entry) > 2 else ''
+                ref_info = ref_entry[3] if len(ref_entry) > 3 else ''
+                ref_source = ref_entry[4] if len(ref_entry) > 4 else ''
                 if additional_type == ref_type and o_Strand == ref_entry[0]:
-                    kept.update({f"{o_Start},{o_Stop}": [o_Strand, options.coverage, additional_type, ref_type, additional_info, ref_info]})
+                    # kept layout: [strand, coverage, additional_type, ref_type, additional_info, ref_info, ref_source]
+                    kept.update({f"{o_Start},{o_Stop}": [o_Strand, options.coverage, additional_type, ref_type, additional_info, ref_info, ref_source]})
         else:
             cov_thresh = options.coverage
             for orf, data in orfs.items():
@@ -598,42 +597,43 @@ def comparator(options):
                     cov = 100.0 * overlap / gene_len
                     g_Strand = r_data[0]
-                    # r_data layout: [strand, 'ref', type, info]
-                    ref_type = r_data[3] if len(r_data) > 2 else ''
-                    ref_info = r_data[-1] if len(r_data) > 3 else ''
+                    # r_data layout now: [strand, 'ref', type, info, source]
+                    ref_type = r_data[2] if len(r_data) > 2 else ''
+                    ref_info = r_data[3] if len(r_data) > 3 else ''
+                    ref_source = r_data[4] if len(r_data) > 4 else ''
                     if abs(o_Stop - g_Stop) % 3 == 0 and o_Strand == g_Strand and cov >= cov_thresh:
                         if additional_type == ref_type:
-                            kept[f"{g_Start},{g_Stop}"] = [g_Strand, int(cov), additional_type, ref_type,
-                                                           additional_info, ref_info]
+                            # keep ref_source with the kept entry
+                            kept[f"{g_Start},{g_Stop}"] = [g_Strand, int(cov), additional_type, ref_type, additional_info, ref_info, ref_source]
         genes_To_Keep_by_contig[contig] = sortORFs(kept)
     # Log counts for debugging why GFF might be empty
-    try:
-        total_ref = sum(len(v) for v in ref_genes_by_contig.values()) if ref_genes_by_contig else 0
-    except Exception:
-        total_ref = 0
-    try:
-        total_add = sum(len(v) for v in additional_by_contig.values()) if additional_by_contig else 0
-    except Exception:
-        total_add = 0
-    try:
-        total_kept = sum(len(v) for v in genes_To_Keep_by_contig.values()) if genes_To_Keep_by_contig else 0
-    except Exception:
-        total_kept = 0
-    logging.info('Reference genes loaded: %d', total_ref)
-    logging.info('Additional ORFs loaded: %d', total_add)
-    logging.info('Kept genes after intersection: %d', total_kept)
+    # Compute summary metrics (safe/simple)
+    total_ref = sum(len(v) for v in ref_genes_by_contig.values()) if ref_genes_by_contig else 0
+    total_add = sum(len(v) for v in additional_by_contig.values()) if additional_by_contig else 0
+    total_kept = sum(len(v) for v in genes_To_Keep_by_contig.values()) if genes_To_Keep_by_contig else 0
+    # Print totals in requested order: reference, additional, then overlap/kept and a percentage
+    logging.info('Totals -- reference_genes=%d, additional_genes=%d, overlapping/kept=%d', total_ref, total_add, total_kept)
+    if total_ref:
+        logging.info('Overlap relative to reference: %.2f%%', (100.0 * total_kept / total_ref))
     # If requested, compute discordance lists and write three GFF outputs
     if getattr(options, 'report_discordance', False):
-        # Compute discordance lists
-        only_in_ref, only_in_additional, mismatches = compute_discordance(ref_genes_by_contig, additional_by_contig, options)
+        # Compute discordance lists and matched additional ORFs
+        only_in_ref, only_in_additional, mismatches, matched_adds = compute_discordance(ref_genes_by_contig, additional_by_contig, options)
         base = os.path.splitext(os.path.basename(options.output_file))[0] if getattr(options, 'output_file', None) else 'discordance'
         outdir = os.path.dirname(options.output_file) if getattr(options, 'output_file', None) else '.'
         ref_base = os.path.splitext(os.path.basename(options.reference_annotation))[0]
-        # Keep the three detailed GFF outputs (backward compatible)
+        # Compute and log clear summary metrics
+        total_ref = sum(len(v) for v in ref_genes_by_contig.values()) if ref_genes_by_contig else 0
+        total_add = sum(len(v) for v in additional_by_contig.values()) if additional_by_contig else 0
+        overlapping_additional = len(matched_adds) if matched_adds is not None else 0
+        overlapping_reference = max(0, total_ref - (len(only_in_ref) if only_in_ref is not None else 0))
+        logging.info('Summary: reference_genes=%d, additional_geness=%d, additional_genes_overlapping_any_reference=%d, reference_genes_overlapped=%d', total_ref, total_add, overlapping_additional, overlapping_reference)
+         # Keep the three detailed GFF outputs (backward compatible)
         gff_ref = os.path.join(outdir, f"{base}.only_in_reference.gff")
         gff_add = os.path.join(outdir, f"{base}.only_in_additional.gff")
         gff_mis = os.path.join(outdir, f"{base}.mismatches.gff")
@@ -679,6 +679,7 @@ def comparator(options):
             contig_summary = {}
         logging.info('Kept genes by contig (sample): %s', dict(list(contig_summary.items())[:10]))
         logging.info('Writing combined GFF to %s', options.output_file)
+        # single correct invocation of gff_writer
         gff_writer(genome_ID, genome_DNA_path, options.reference_annotation, getattr(options, 'reference_tool', None), None, options.additional_annotation, options.additional_tool, genes_To_Keep_by_contig, options.output_file, getattr(options, 'gene_ident', None))
         logging.info('gff_writer finished (check output file)')
     except Exception as e:
@@ -688,8 +689,6 @@ def comparator(options):
 def main():
-    print(WELCOME)
     parser = argparse.ArgumentParser(description='ORForise ' + ORForise_Version + ': Annotation-Intersector Run Parameters')
     required = parser.add_argument_group('Required Arguments')
@@ -721,6 +720,20 @@ def main():
 if __name__ == '__main__':
-    main()
-    print('Complete')
+    try:
+        try:
+            main()
+        except Exception:
+            logging.exception('Unhandled exception in main')
+    finally:
+        print(CLOSING)

ORForise/Convert_To_GFF.py CHANGED Viewed

@@ -73,8 +73,6 @@ def load_genome(genome_fasta):
 def main():
-    print(WELCOME)
     parser = argparse.ArgumentParser(description='ORForise ' + ORForise_Version + ': Convert-To-GFF Run Parameters')
     parser._action_groups.pop()
@@ -138,4 +136,10 @@ def main():
     logging.info('Logfile: %s', logfile)
 if __name__ == '__main__':
-    main()
+    try:
+        try:
+            main()
+        except Exception:
+            logging.exception('Unhandled exception in main')
+    finally:
+        print(CLOSING)

ORForise/GFF_Adder.py CHANGED Viewed

@@ -496,8 +496,6 @@ def gff_adder(options):
 def main():
-    print(WELCOME)
     parser = argparse.ArgumentParser(description='ORForise ' + ORForise_Version + ': GFF-Adder Run Parameters.')
     parser._action_groups.pop()
@@ -539,5 +537,10 @@ def main():
 if __name__ == "__main__":
-    main()
-    print("Complete")
+    try:
+        try:
+            main()
+        except Exception:
+            logging.exception('Unhandled exception in main')
+    finally:
+        print(CLOSING)

ORForise/List_Tools.py CHANGED Viewed

@@ -11,8 +11,6 @@ except (ImportError, ModuleNotFoundError):
 def main():
-    print(WELCOME)
     print('ORForise ' + ORForise_Version + ': List Tools Run Parameters')
     tools = set()
@@ -52,5 +50,10 @@ def main():
 if __name__ == "__main__":
-    main()
-    print("Complete")
+    try:
+        try:
+            main()
+        except Exception:
+            print('Unhandled exception in main')
+    finally:
+        print(CLOSING)

ORForise/StORForise.py CHANGED Viewed

@@ -101,7 +101,6 @@ def comparator(tool, input_to_analyse, storfs_to_find_missing, genome_to_compare
 def main():
-    print(WELCOME)
     parser = argparse.ArgumentParser(description='ORForise ' + ORForise_Version + ': StORForise Run Parameters.')
     parser.add_argument('-t', '--tool', default='GFF', help='Which tool/format would you analyse with StORF-R?')
     parser.add_argument('-i', '--input_to_analyse', default='', help='Location of file containing missed genes')
@@ -112,4 +111,10 @@ def main():
     comparator(**vars(args))
 if __name__ == "__main__":
-    main()
+    try:
+        try:
+            main()
+        except Exception:
+            print('Unhandled exception in main')
+    finally:
+        print(CLOSING)

ORForise/Tools/GFF/GFF.py CHANGED Viewed

@@ -31,7 +31,7 @@ def GFF(*args):
         genome_rev = revCompIterative(genome)
         with open(tool_pred, 'r') as gff_input:
             for line in gff_input:
-                if '#' not in line:
+                if not line.startswith('#'):
                     line = line.split('\t')
                     #gene_types = types.split(',') - Temporary fix
                     #if any(gene_type == line[2] for gene_type in gene_types) and len(line) == 9:  # line[2] for normalrun
@@ -68,7 +68,7 @@ def GFF(*args):
                                 stopCodon = genome[stop - 3:stop]
                         po = str(start) + ',' + str(stop)
                         orf = [strand, startCodon, stopCodon, line[2], 'GFF-Standard'] # This needs to detect the type
-                        GFF_ORFs.update({po: orf})
+                        GFF_ORFs[dna_region].update({po: orf})
                     # elif "CDS" in line[2]:
                     #     sys.exit("SAS")

ORForise/Tools/StORF-Reporter/StORF-Reporter.py CHANGED Viewed

@@ -13,8 +13,8 @@ def StORF_Reporter(*args):
     dna_regions = args[1]
     if not dna_regions: # This triggers if dna_regions is an empty dict (GFF_Intersect passed nothing)
         dna_regions = collections.OrderedDict()
-        with open(tool_pred, 'r') as StORF-Reporter_input:
-            for line in StORF-Reporter_input:
+        with open(tool_pred, 'r') as StORF_Reporter_input:
+            for line in StORF_Reporter_input:
                 line = line.split()
                 if 'StORF-Reporter' in line[1] or 'StoRF_Reporter' in line[1]  or 'StORF' in line[1] or 'StORF-Reporter' in line[1] and line[0] not in dna_regions:
                     dna_regions[line[0]] = []  # Placeholder for genome sequence

ORForise/utils.py CHANGED Viewed

@@ -4,8 +4,8 @@ import collections
 # Constants
 SHORT_ORF_LENGTH = 300
 MIN_COVERAGE = 75
-ORForise_Version = 'v1.6.1'
-WELCOME=("Thank you for using ORForise\nPlease report any issues to: https://github.com/NickJD/ORForise/issues\n"
+ORForise_Version = 'v1.6.4'
+CLOSING=("\n####\nThank you for using ORForise\nPlease report any issues to: https://github.com/NickJD/ORForise/issues\n"
         "Please Cite: https://doi.org/10.1093/bioinformatics/btab827\n"
         "#####")

{orforise-1.6.2.dist-info → orforise-1.6.4.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: ORForise
-Version: 1.6.2
+Version: 1.6.4
 Summary: ORForise - A platform for analysing and comparing genome annotations.
 Author-email: Nicholas Dimonaco <nicholas@dimonaco.co.uk>
 License:                     GNU GENERAL PUBLIC LICENSE
@@ -662,7 +662,7 @@ Example output files from ```Annotation-Compare```, ```Aggregate-Compare```, ```
 For Help: ```Annotation-Compare -h ```
 ```python
-ORForise v1.6.2: Annotatione-Compare Run Parameters.
+ORForise v1.6.4: Annotatione-Compare Run Parameters.
 Required Arguments:
   -dna GENOME_DNA       Genome DNA file (.fa) which both annotations are based on
@@ -730,7 +730,7 @@ ORForise can be used as the example below.
 For Help: ```Aggregate-Compare -h ```
 ```python
-ORForise v1.6.2: Aggregate-Compare Run Parameters.
+ORForise v1.6.4: Aggregate-Compare Run Parameters.
 Required Arguments:
   -dna GENOME_DNA       Genome DNA file (.fa) which both annotations are based on
@@ -811,7 +811,7 @@ GFF-Adder combines two existing annotations (GFF or other tool formats).
 For Help: ```GFF-Adder -h ```
 ```python
-ORForise v1.6.2: GFF-Adder Run Parameters.
+ORForise v1.6.4: GFF-Adder Run Parameters.
 Required Arguments:
   -dna GENOME_DNA       Genome DNA file (.fa) which both annotations are based on
@@ -868,7 +868,7 @@ usage: Annotation_Intersector.py [-h] -ref REFERENCE_ANNOTATION -at
                                  [-cov COVERAGE] [--report-discordance]
                                  [--report-discordance-file REPORT_DISCORDANCE_FILE]
-ORForise v1.6.2: Annotation-Intersector Run Parameters
+ORForise v1.6.4: Annotation-Intersector Run Parameters
 options:
   -h, --help            show this help message and exit
@@ -947,7 +947,7 @@ Please report any issues to: https://github.com/NickJD/ORForise/issues
 #####
 usage: Convert_To_GFF.py [-h] [-dna GENOME_DNA] -i INPUT_ANNOTATION -fmt FORMAT -o OUTPUT_DIR [-gi GENE_IDENT] [--verbose]
-ORForise v1.6.2: Convert-To-GFF Run Parameters
+ORForise v1.6.4: Convert-To-GFF Run Parameters
 Required Arguments:
   -dna GENOME_DNA      Genome DNA file (.fa)
@@ -1026,7 +1026,7 @@ Defaults options were used.
 **MetaGeneMark - Version '2020'** - http://exon.gatech.edu/meta_gmhmmp.cgi
 GFF was chosen as output type.
-**Prodigal - Version 2.6.3** - https://github.com/hyattpd/Prodigal
+**Prodigal (Includes Pyrodigal) - Version 2.6.3** - https://github.com/hyattpd/Prodigal
 GFF was chosen as output type.
 **TransDecoder - Version 5.5.0** - https://github.com/TransDecoder/TransDecoder/wiki

{orforise-1.6.2.dist-info → orforise-1.6.4.dist-info}/RECORD RENAMED Viewed

@@ -1,13 +1,13 @@
-ORForise/Aggregate_Compare.py,sha256=T61SdH9cY6KE9HnoVMqEn_yt5GOiG6_GukoVCMiCXaA,22788
-ORForise/Annotation_Compare.py,sha256=kd0J6UpvYlppmjSBenp9-Zrwzu1p5fnfMs8CvofAtXA,18460
-ORForise/Annotation_Intersector.py,sha256=LvV5h4NTZzzkaa1N2tOU8Bz63Fi2kRCy9c4qrmwXdkM,34481
+ORForise/Aggregate_Compare.py,sha256=AzGOfuQLt4haw4rdCwIEag5Y7hnXHLLApkTa6_j99-A,22887
+ORForise/Annotation_Compare.py,sha256=7_LwWKDKZHBrhUWODxTJgd-tppaA4k5IvNuX4bU8_2Q,18571
+ORForise/Annotation_Intersector.py,sha256=7VH7iHk4m1c08AeKf9vGEYuAecsywfC4AQHUlIbgQKQ,35856
 ORForise/Comparator.py,sha256=59VfUS8d19Xa83o1AsCuowDhhe-iNr5wO4FutDpoQRs,48078
-ORForise/Convert_To_GFF.py,sha256=6HUiWQUGOyEohvWDJH3hGLBvCvzFy0MdyZK_K29ikA8,5898
-ORForise/GFF_Adder.py,sha256=dm4JjezKUKHDMINf_lWLtm2nj4uvziJhwp3YYi5wSCg,28560
-ORForise/List_Tools.py,sha256=g46MLl4XU4VDJHeZ7Ky-SwEU9hLTxQ6LCCHG2DasxM8,1519
-ORForise/StORForise.py,sha256=ZlI_wLUE6QFKtRtrAAIEmeYA04Pucl36ys_CHFRO1xE,5650
+ORForise/Convert_To_GFF.py,sha256=zkpO3vpLxA7EpKe1X1i-_IPbcU3lbwLCsh30mmeuZkI,6030
+ORForise/GFF_Adder.py,sha256=PuOZl4TUN9SbMjGhkuF92UDePAnx0NdVAuWFRxR61XA,28670
+ORForise/List_Tools.py,sha256=OZadIWAP0HJ_JYlTDqWw_EA8Mkew-26_cKOkRE4i7ro,1618
+ORForise/StORForise.py,sha256=yRZtKXKcmevxZ_2asesYdkl-qen3MmOn9_r0vb0927I,5772
 ORForise/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-ORForise/utils.py,sha256=sEDOATM5v50g9sKbBf2QinaCnGel7EtnKiR-UebtTwQ,15751
+ORForise/utils.py,sha256=QdXT0XkEIjMbu4ef2HDwAKa_19m8oeu4QV8oLll5gpk,15759
 ORForise/Aux/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 ORForise/Aux/StORF_Undetected/StORF_Undetected.py,sha256=B7f9AxXD6j2ip4QtuOi7pwtfBCxkexE0XiDCJrKSX5U,1318
 ORForise/Aux/StORF_Undetected/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
@@ -37,7 +37,7 @@ ORForise/Tools/FGENESB/FGENESB.py,sha256=E6vghsstDeYgmT1lT4DL2M7wreYeXx2s-N-scCu
 ORForise/Tools/FGENESB/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 ORForise/Tools/FragGeneScan/FragGeneScan.py,sha256=koPby-VZZ7X6RA1OBc3-yr9axGlm82LVbFZJ-kyx1Kw,2365
 ORForise/Tools/FragGeneScan/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-ORForise/Tools/GFF/GFF.py,sha256=OBm3UmgusisqV7deUMHkruO3PLdlzr3OAc4OsZmRMdo,3763
+ORForise/Tools/GFF/GFF.py,sha256=Q2BFzfJAqL7QYRhTsjPXAK0vyGtNAtIdPATVW6jMwW8,3784
 ORForise/Tools/GFF/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 ORForise/Tools/GLIMMER3/GLIMMER3.py,sha256=EddNu6M1NrWDbWjvByM9gvStuvWoD5lq5jz0M27oro8,2686
 ORForise/Tools/GLIMMER3/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
@@ -61,13 +61,13 @@ ORForise/Tools/Prodigal/Prodigal.py,sha256=1KVkTL3gHp8iSNFt_CvPnLZUr66x1AfE0ZKxo
 ORForise/Tools/Prodigal/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 ORForise/Tools/Prokka/Prokka.py,sha256=Kcl1ocVj6hPOfEEwf8bBAWhzWX_XAe55kwNUeM8EUKg,2468
 ORForise/Tools/Prokka/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-ORForise/Tools/StORF-Reporter/StORF-Reporter.py,sha256=mbpoCuzVDVVFZgSd3TDzgjbp-JsrxIDB-DL2qjQwq-U,2647
+ORForise/Tools/StORF-Reporter/StORF-Reporter.py,sha256=BQpFfpXtcNC4C_P4Bk5IZZ9__Xy2VNcbh7zzSDnrNOE,2647
 ORForise/Tools/StORF-Reporter/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 ORForise/Tools/TransDecoder/TransDecoder.py,sha256=l9y4OFxhSdPRBhUprs0yt2fxtSwyNCOv7oKO-aTvpDk,2381
 ORForise/Tools/TransDecoder/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-orforise-1.6.2.dist-info/licenses/LICENSE,sha256=eAL1bBUjSMCdvudcn9E3sbujCBCa839cqXxauONDbSU,32476
-orforise-1.6.2.dist-info/METADATA,sha256=xqVn0TcMdZkrKeyVbjENidxxhN6PKuHZkb0WC2nx5pE,59554
-orforise-1.6.2.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
-orforise-1.6.2.dist-info/entry_points.txt,sha256=_HaBzKQFXCkxHIIgBH_XIOng92-GWJ5FC29LmNaSpR0,670
-orforise-1.6.2.dist-info/top_level.txt,sha256=7kmFicUFY65FJmioc0cpZtXVz93V7KSKvZVWpGz5Hyk,9
-orforise-1.6.2.dist-info/RECORD,,
+orforise-1.6.4.dist-info/licenses/LICENSE,sha256=eAL1bBUjSMCdvudcn9E3sbujCBCa839cqXxauONDbSU,32476
+orforise-1.6.4.dist-info/METADATA,sha256=cJbN2ekkUs5mP8izYLMqxv8r4awotKf6DtVQNDvuPFo,59575
+orforise-1.6.4.dist-info/WHEEL,sha256=qELbo2s1Yzl39ZmrAibXA2jjPLUYfnVhUNTlyF1rq0Y,92
+orforise-1.6.4.dist-info/entry_points.txt,sha256=_HaBzKQFXCkxHIIgBH_XIOng92-GWJ5FC29LmNaSpR0,670
+orforise-1.6.4.dist-info/top_level.txt,sha256=7kmFicUFY65FJmioc0cpZtXVz93V7KSKvZVWpGz5Hyk,9
+orforise-1.6.4.dist-info/RECORD,,

{orforise-1.6.2.dist-info → orforise-1.6.4.dist-info}/WHEEL RENAMED Viewed

@@ -1,5 +1,5 @@
 Wheel-Version: 1.0
-Generator: setuptools (80.9.0)
+Generator: setuptools (80.10.1)
 Root-Is-Purelib: true
 Tag: py3-none-any

{orforise-1.6.2.dist-info → orforise-1.6.4.dist-info}/entry_points.txt RENAMED Viewed

File without changes

{orforise-1.6.2.dist-info → orforise-1.6.4.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

{orforise-1.6.2.dist-info → orforise-1.6.4.dist-info}/top_level.txt RENAMED Viewed

File without changes

ORForise 1.6.2__py3-none-any.whl → 1.6.4__py3-none-any.whl

ORForise 1.6.2__py3-none-any.whl → 1.6.4__py3-none-any.whl