bioroebe 0.10.80
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +7 -0
- data/LICENSE.md +428 -0
- data/README.md +9280 -0
- data/bin/advanced_dotplot +7 -0
- data/bin/align_open_reading_frames +12 -0
- data/bin/all_positions_of_this_nucleotide +7 -0
- data/bin/aminoacid_composition +7 -0
- data/bin/aminoacid_frequencies +12 -0
- data/bin/aminoacid_substitution +7 -0
- data/bin/automatically_rename_this_fasta_file +7 -0
- data/bin/base_composition +7 -0
- data/bin/batch_create_windows_executables +7 -0
- data/bin/biomart_console +11 -0
- data/bin/bioroebe +27 -0
- data/bin/bioroebe_controller +10 -0
- data/bin/bioshell +26 -0
- data/bin/blosum_2D_table +12 -0
- data/bin/calculate_n50_value +12 -0
- data/bin/chunked_display +12 -0
- data/bin/codon_frequency +9 -0
- data/bin/codon_to_aminoacid +30 -0
- data/bin/colourize_this_fasta_sequence +14 -0
- data/bin/compact_fasta_file +7 -0
- data/bin/complement +7 -0
- data/bin/complementary_dna_strand +12 -0
- data/bin/complementary_rna_strand +12 -0
- data/bin/compseq +7 -0
- data/bin/consensus_sequence +17 -0
- data/bin/count_AT +12 -0
- data/bin/count_GC +12 -0
- data/bin/create_random_aminoacids +7 -0
- data/bin/decode_this_aminoacid_sequence +20 -0
- data/bin/deduce_aminoacid_sequence +13 -0
- data/bin/deduce_most_likely_aminoacid_sequence +7 -0
- data/bin/display_aminoacid_table +12 -0
- data/bin/display_open_reading_frames +7 -0
- data/bin/dna_to_aminoacid_sequence +7 -0
- data/bin/dna_to_rna +7 -0
- data/bin/downcase_chunked_display +12 -0
- data/bin/download_this_pdb +7 -0
- data/bin/fasta_index +7 -0
- data/bin/fetch_data_from_uniprot +12 -0
- data/bin/filter_away_invalid_nucleotides +12 -0
- data/bin/find_substring +19 -0
- data/bin/genbank_to_fasta +7 -0
- data/bin/hamming_distance +12 -0
- data/bin/input_as_dna +12 -0
- data/bin/is_palindrome +13 -0
- data/bin/leading_five_prime +7 -0
- data/bin/levensthein +7 -0
- data/bin/longest_ORF +14 -0
- data/bin/longest_substring +12 -0
- data/bin/n_stop_codons_in_this_sequence +15 -0
- data/bin/open_reading_frames +14 -0
- data/bin/overwrite_fasta_header +7 -0
- data/bin/palindrome_2D_structure +7 -0
- data/bin/palindrome_generator +7 -0
- data/bin/parse_fasta +7 -0
- data/bin/partner_nucleotide +9 -0
- data/bin/possible_codons_for_this_aminoacid +12 -0
- data/bin/random_dna_sequence +12 -0
- data/bin/random_sequence +12 -0
- data/bin/raw_hamming_distance +12 -0
- data/bin/return_longest_substring_via_LCS_algorithm +7 -0
- data/bin/reverse_complement +7 -0
- data/bin/reverse_sequence +7 -0
- data/bin/ruler +12 -0
- data/bin/scan_this_input_for_startcodons +12 -0
- data/bin/short_aminoacid_letter_from_long_aminoacid_name +7 -0
- data/bin/show_atomic_composition +7 -0
- data/bin/show_codon_usage +12 -0
- data/bin/show_fasta_header +7 -0
- data/bin/show_nucleotide_sequence +7 -0
- data/bin/show_this_codon_table +7 -0
- data/bin/show_this_dna_sequence +7 -0
- data/bin/showorf +14 -0
- data/bin/simplify_fasta +7 -0
- data/bin/sort_aminoacid_based_on_its_hydrophobicity +7 -0
- data/bin/split_this_fasta_file_into_chromosomes +7 -0
- data/bin/strict_filter_away_invalid_aminoacids +7 -0
- data/bin/taxonomy +63 -0
- data/bin/three_to_one +7 -0
- data/bin/to_rna +7 -0
- data/bin/trailing_three_prime +7 -0
- data/bin/trypsin_digest +7 -0
- data/bin/upcase_this_aminoacid_sequence_and_remove_numbers +7 -0
- data/bioroebe.gemspec +97 -0
- data/doc/IUPAC_aminoacids_code.md +36 -0
- data/doc/IUPAC_nucleotide_code.md +19 -0
- data/doc/README.gen +9237 -0
- data/doc/blosum.md +5 -0
- data/doc/compatibility/BIO_PHP.md +37 -0
- data/doc/compatibility/README.md +3 -0
- data/doc/compatibility/emboss.md +56 -0
- data/doc/extensive_usage_example.md +35 -0
- data/doc/german_names_for_the_aminoacids.md +27 -0
- data/doc/instructions_for_the_taxonomy_subproject.md +504 -0
- data/doc/legacy_paths.md +9 -0
- data/doc/pdb_ATOM_entry.md +33 -0
- data/doc/quality_control/README.md +2 -0
- data/doc/quality_control/commandline_applications.md +13 -0
- data/doc/resources.md +23 -0
- data/doc/setup.rb +1655 -0
- data/doc/statistics/statistics.md +41 -0
- data/doc/todo/README.md +5 -0
- data/doc/todo/bioroebe_GUI_todo.md +15 -0
- data/doc/todo/bioroebe_todo.md +2823 -0
- data/doc/using_biomart.md +258 -0
- data/html/test.html +144 -0
- data/lib/bioroebe/aminoacids/aminoacid_substitution.rb +118 -0
- data/lib/bioroebe/aminoacids/aminoacids_mass_table.rb +118 -0
- data/lib/bioroebe/aminoacids/codon_percentage.rb +189 -0
- data/lib/bioroebe/aminoacids/colourize_hydrophilic_and_hydrophobic_aminoacids.rb +110 -0
- data/lib/bioroebe/aminoacids/create_random_aminoacids.rb +221 -0
- data/lib/bioroebe/aminoacids/deduce_aminoacid_sequence.rb +460 -0
- data/lib/bioroebe/aminoacids/display_aminoacid_table.rb +231 -0
- data/lib/bioroebe/aminoacids/show_hydrophobicity.rb +184 -0
- data/lib/bioroebe/annotations/README.md +2 -0
- data/lib/bioroebe/annotations/create_annotation_format.rb +208 -0
- data/lib/bioroebe/autoinclude.rb +7 -0
- data/lib/bioroebe/base/base.rb +35 -0
- data/lib/bioroebe/base/colours.rb +14 -0
- data/lib/bioroebe/base/colours_for_base/colours_for_base.rb +275 -0
- data/lib/bioroebe/base/commandline_application/README.md +7 -0
- data/lib/bioroebe/base/commandline_application/aminoacids.rb +33 -0
- data/lib/bioroebe/base/commandline_application/commandline_application.rb +37 -0
- data/lib/bioroebe/base/commandline_application/commandline_arguments.rb +144 -0
- data/lib/bioroebe/base/commandline_application/directory.rb +33 -0
- data/lib/bioroebe/base/commandline_application/extract.rb +22 -0
- data/lib/bioroebe/base/commandline_application/misc.rb +485 -0
- data/lib/bioroebe/base/commandline_application/opn.rb +47 -0
- data/lib/bioroebe/base/commandline_application/reset.rb +40 -0
- data/lib/bioroebe/base/commandline_application/warnings.rb +36 -0
- data/lib/bioroebe/base/commandline_application/write_what_into.rb +29 -0
- data/lib/bioroebe/base/initialize.rb +18 -0
- data/lib/bioroebe/base/misc.rb +94 -0
- data/lib/bioroebe/base/namespace.rb +16 -0
- data/lib/bioroebe/base/prototype/README.md +12 -0
- data/lib/bioroebe/base/prototype/e_and_ee.rb +24 -0
- data/lib/bioroebe/base/prototype/misc.rb +108 -0
- data/lib/bioroebe/base/prototype/mkdir.rb +20 -0
- data/lib/bioroebe/base/prototype/prototype.rb +21 -0
- data/lib/bioroebe/base/prototype/reset.rb +26 -0
- data/lib/bioroebe/base/reset.rb +11 -0
- data/lib/bioroebe/biomart/LICENSE.md +27 -0
- data/lib/bioroebe/biomart/attribute.rb +77 -0
- data/lib/bioroebe/biomart/biomart.rb +227 -0
- data/lib/bioroebe/biomart/database.rb +128 -0
- data/lib/bioroebe/biomart/dataset.rb +572 -0
- data/lib/bioroebe/biomart/filter.rb +97 -0
- data/lib/bioroebe/biomart/server.rb +152 -0
- data/lib/bioroebe/blosum/blosum.rb +88 -0
- data/lib/bioroebe/calculate/calculate_blosum_score.rb +145 -0
- data/lib/bioroebe/calculate/calculate_gc_content.rb +301 -0
- data/lib/bioroebe/calculate/calculate_levensthein_distance.rb +100 -0
- data/lib/bioroebe/calculate/calculate_melting_temperature.rb +398 -0
- data/lib/bioroebe/calculate/calculate_melting_temperature_for_more_than_thirteen_nucleotides.rb +304 -0
- data/lib/bioroebe/calculate/calculate_the_position_specific_scoring_matrix.rb +166 -0
- data/lib/bioroebe/cell/README.md +1 -0
- data/lib/bioroebe/cell/cell.rb +63 -0
- data/lib/bioroebe/cleave_and_digest/README.md +2 -0
- data/lib/bioroebe/cleave_and_digest/cleave.rb +80 -0
- data/lib/bioroebe/cleave_and_digest/digestion.rb +75 -0
- data/lib/bioroebe/cleave_and_digest/trypsin.rb +192 -0
- data/lib/bioroebe/codon_tables/README.md +9 -0
- data/lib/bioroebe/codon_tables/frequencies/287_Pseudomonas_aeruginosa.yml +101 -0
- data/lib/bioroebe/codon_tables/frequencies/3702_Arabidopsis_thaliana.yml +77 -0
- data/lib/bioroebe/codon_tables/frequencies/4932_Saccharomyces_cerevisiae.yml +103 -0
- data/lib/bioroebe/codon_tables/frequencies/7227_Drosophila_melanogaster.yml +71 -0
- data/lib/bioroebe/codon_tables/frequencies/83333_Escherichia_coli_K12.yml +103 -0
- data/lib/bioroebe/codon_tables/frequencies/9606_Homo_sapiens.yml +123 -0
- data/lib/bioroebe/codon_tables/frequencies/9685_Felis_catus.yml +78 -0
- data/lib/bioroebe/codon_tables/frequencies/README.md +10 -0
- data/lib/bioroebe/codon_tables/frequencies/parse_frequency_table.rb +337 -0
- data/lib/bioroebe/codons/README.md +28 -0
- data/lib/bioroebe/codons/codon_table.rb +416 -0
- data/lib/bioroebe/codons/codon_tables.rb +123 -0
- data/lib/bioroebe/codons/codons.rb +517 -0
- data/lib/bioroebe/codons/convert_this_codon_to_that_aminoacid.rb +102 -0
- data/lib/bioroebe/codons/detect_minimal_codon.rb +180 -0
- data/lib/bioroebe/codons/determine_optimal_codons.rb +74 -0
- data/lib/bioroebe/codons/possible_codons_for_this_aminoacid.rb +380 -0
- data/lib/bioroebe/codons/sanitize_codon_frequency.rb +144 -0
- data/lib/bioroebe/codons/show_codon_tables.rb +130 -0
- data/lib/bioroebe/codons/show_codon_usage.rb +197 -0
- data/lib/bioroebe/codons/show_this_codon_table.rb +573 -0
- data/lib/bioroebe/codons/start_codons.rb +105 -0
- data/lib/bioroebe/colours/colour_schemes/README.md +10 -0
- data/lib/bioroebe/colours/colour_schemes/array_available_colour_schemes.rb +38 -0
- data/lib/bioroebe/colours/colour_schemes/buried.rb +70 -0
- data/lib/bioroebe/colours/colour_schemes/colour_scheme.rb +101 -0
- data/lib/bioroebe/colours/colour_schemes/colour_scheme_demo.rb +262 -0
- data/lib/bioroebe/colours/colour_schemes/helix.rb +65 -0
- data/lib/bioroebe/colours/colour_schemes/hydropathy.rb +70 -0
- data/lib/bioroebe/colours/colour_schemes/nucleotide.rb +47 -0
- data/lib/bioroebe/colours/colour_schemes/score.rb +112 -0
- data/lib/bioroebe/colours/colour_schemes/simple.rb +42 -0
- data/lib/bioroebe/colours/colour_schemes/strand.rb +65 -0
- data/lib/bioroebe/colours/colour_schemes/taylor.rb +58 -0
- data/lib/bioroebe/colours/colour_schemes/turn.rb +65 -0
- data/lib/bioroebe/colours/colour_schemes/zappo.rb +59 -0
- data/lib/bioroebe/colours/colourize_sequence.rb +262 -0
- data/lib/bioroebe/colours/colours.rb +119 -0
- data/lib/bioroebe/colours/misc_colours.rb +80 -0
- data/lib/bioroebe/colours/rev.rb +41 -0
- data/lib/bioroebe/colours/sdir.rb +21 -0
- data/lib/bioroebe/colours/sfancy.rb +21 -0
- data/lib/bioroebe/colours/sfile.rb +21 -0
- data/lib/bioroebe/colours/simp.rb +21 -0
- data/lib/bioroebe/colours/swarn.rb +29 -0
- data/lib/bioroebe/colours/use_colours.rb +27 -0
- data/lib/bioroebe/configuration/configuration.rb +114 -0
- data/lib/bioroebe/configuration/constants.rb +35 -0
- data/lib/bioroebe/constants/GUIs.rb +79 -0
- data/lib/bioroebe/constants/aminoacids_and_proteins.rb +146 -0
- data/lib/bioroebe/constants/base_directory.rb +120 -0
- data/lib/bioroebe/constants/carriage_return.rb +14 -0
- data/lib/bioroebe/constants/codon_tables.rb +77 -0
- data/lib/bioroebe/constants/database_constants.rb +107 -0
- data/lib/bioroebe/constants/files_and_directories.rb +579 -0
- data/lib/bioroebe/constants/misc.rb +189 -0
- data/lib/bioroebe/constants/newline.rb +14 -0
- data/lib/bioroebe/constants/nucleotides.rb +114 -0
- data/lib/bioroebe/constants/regex.rb +28 -0
- data/lib/bioroebe/constants/roebe.rb +38 -0
- data/lib/bioroebe/constants/row_terminator.rb +16 -0
- data/lib/bioroebe/constants/tabulator.rb +14 -0
- data/lib/bioroebe/constants/unicode.rb +12 -0
- data/lib/bioroebe/constants/urls.rb +50 -0
- data/lib/bioroebe/conversions/README.md +3 -0
- data/lib/bioroebe/conversions/convert_aminoacid_to_dna.rb +298 -0
- data/lib/bioroebe/conversions/dna_to_aminoacid_sequence.rb +569 -0
- data/lib/bioroebe/count/README.md +1 -0
- data/lib/bioroebe/count/count_amount_of_aminoacids.rb +352 -0
- data/lib/bioroebe/count/count_amount_of_nucleotides.rb +491 -0
- data/lib/bioroebe/count/count_at.rb +39 -0
- data/lib/bioroebe/count/count_gc.rb +43 -0
- data/lib/bioroebe/css/README.md +5 -0
- data/lib/bioroebe/css/project.css +121 -0
- data/lib/bioroebe/data/README.md +10 -0
- data/lib/bioroebe/data/bam/README.md +1 -0
- data/lib/bioroebe/data/data.txt +192 -0
- data/lib/bioroebe/data/fasta/GFP_mutant_3_coding_sequence.fasta +12 -0
- data/lib/bioroebe/data/fasta/alu_elements.fasta +42 -0
- data/lib/bioroebe/data/fasta/lady_slippers_orchid.fasta +1197 -0
- data/lib/bioroebe/data/fasta/loxP.fasta +2 -0
- data/lib/bioroebe/data/fasta/ls_orchid.fasta +1197 -0
- data/lib/bioroebe/data/fasta/pax6_in_mouse.fasta +1 -0
- data/lib/bioroebe/data/fasta/test.fasta +7 -0
- data/lib/bioroebe/data/fasta/test_DNA.fasta +1 -0
- data/lib/bioroebe/data/fastq/fastq_example_file.fastq +32 -0
- data/lib/bioroebe/data/fastq/fastq_example_file_SP1.fastq +1000 -0
- data/lib/bioroebe/data/fastq/one_random_fastq_entry.fastq +4 -0
- data/lib/bioroebe/data/genbank/sample_file.genbank +15 -0
- data/lib/bioroebe/data/genbank/standard.fasta +3 -0
- data/lib/bioroebe/data/gff/Escherichia_coli_K12_plasmid_F_DNA_NC_002483.1.gff3 +345 -0
- data/lib/bioroebe/data/gff/sample.gff +2 -0
- data/lib/bioroebe/data/gff/test_gene.gff +4 -0
- data/lib/bioroebe/data/gff/transcripts.gff +16 -0
- data/lib/bioroebe/data/gtf/README.md +1 -0
- data/lib/bioroebe/data/json/example_config.json +48 -0
- data/lib/bioroebe/data/pdb/1VII.pdb +754 -0
- data/lib/bioroebe/data/pdb/ala_phe_ala.pdb +228 -0
- data/lib/bioroebe/data/pdb/rcsb_pdb_1VII.fasta +2 -0
- data/lib/bioroebe/data/phylip/README.md +11 -0
- data/lib/bioroebe/data/phylip/example.phylip +7 -0
- data/lib/bioroebe/data/svg/example.svg +301 -0
- data/lib/bioroebe/databases/README.md +1 -0
- data/lib/bioroebe/databases/download_taxonomy_database.rb +102 -0
- data/lib/bioroebe/dotplots/README.md +5 -0
- data/lib/bioroebe/dotplots/advanced_dotplot.rb +256 -0
- data/lib/bioroebe/dotplots/dotplot.rb +184 -0
- data/lib/bioroebe/electron_microscopy/coordinate_analyzer.rb +191 -0
- data/lib/bioroebe/electron_microscopy/fix_pos_file.rb +102 -0
- data/lib/bioroebe/electron_microscopy/generate_em2em_file.rb +122 -0
- data/lib/bioroebe/electron_microscopy/parse_coordinates.rb +197 -0
- data/lib/bioroebe/electron_microscopy/read_file_xmd.rb +282 -0
- data/lib/bioroebe/electron_microscopy/simple_star_file_generator.rb +131 -0
- data/lib/bioroebe/encoding/README.md +2 -0
- data/lib/bioroebe/encoding/encoding.rb +45 -0
- data/lib/bioroebe/enzymes/README.md +2 -0
- data/lib/bioroebe/enzymes/has_this_restriction_enzyme.rb +46 -0
- data/lib/bioroebe/enzymes/restriction_enzyme.rb +200 -0
- data/lib/bioroebe/enzymes/restriction_enzymes_file.rb +72 -0
- data/lib/bioroebe/enzymes/return_restriction_enzyme_sequence_and_cut_position.rb +80 -0
- data/lib/bioroebe/enzymes/return_sequence_that_is_cut_via_restriction_enzyme.rb +65 -0
- data/lib/bioroebe/enzymes/show_restriction_enzymes.rb +119 -0
- data/lib/bioroebe/exceptions/README.md +2 -0
- data/lib/bioroebe/exceptions/exceptions.rb +17 -0
- data/lib/bioroebe/ext/LICENCE.md +5 -0
- data/lib/bioroebe/ext/README.md +7 -0
- data/lib/bioroebe/ext/main.cpp +45 -0
- data/lib/bioroebe/ext/nucleotide.cpp +24 -0
- data/lib/bioroebe/ext/nussinov_algorithm.cpp +348 -0
- data/lib/bioroebe/ext/sequence +0 -0
- data/lib/bioroebe/ext/sequence.cpp +162 -0
- data/lib/bioroebe/fasta_and_fastq/README.md +6 -0
- data/lib/bioroebe/fasta_and_fastq/autocorrect_the_name_of_this_fasta_file.rb +88 -0
- data/lib/bioroebe/fasta_and_fastq/compact_fasta_file/compact_fasta_file.rb +151 -0
- data/lib/bioroebe/fasta_and_fastq/display_how_many_fasta_entries_are_in_this_directory.rb +111 -0
- data/lib/bioroebe/fasta_and_fastq/download_fasta.rb +248 -0
- data/lib/bioroebe/fasta_and_fastq/fasta_defline/README.md +2 -0
- data/lib/bioroebe/fasta_and_fastq/fasta_defline/fasta_defline.rb +113 -0
- data/lib/bioroebe/fasta_and_fastq/fasta_parser.rb +167 -0
- data/lib/bioroebe/fasta_and_fastq/fastq_format_explainer.rb +131 -0
- data/lib/bioroebe/fasta_and_fastq/length_modifier/length_modifier.rb +87 -0
- data/lib/bioroebe/fasta_and_fastq/parse_fasta/constants.rb +50 -0
- data/lib/bioroebe/fasta_and_fastq/parse_fasta/initialize.rb +86 -0
- data/lib/bioroebe/fasta_and_fastq/parse_fasta/menu.rb +117 -0
- data/lib/bioroebe/fasta_and_fastq/parse_fasta/misc.rb +981 -0
- data/lib/bioroebe/fasta_and_fastq/parse_fasta/parse_fasta.rb +27 -0
- data/lib/bioroebe/fasta_and_fastq/parse_fasta/report.rb +156 -0
- data/lib/bioroebe/fasta_and_fastq/parse_fasta/reset.rb +128 -0
- data/lib/bioroebe/fasta_and_fastq/parse_fasta/run.rb +20 -0
- data/lib/bioroebe/fasta_and_fastq/parse_fastq/parse_fastq.rb +83 -0
- data/lib/bioroebe/fasta_and_fastq/return_fasta_subsection_of_this_file.rb +112 -0
- data/lib/bioroebe/fasta_and_fastq/show_fasta_headers.rb +135 -0
- data/lib/bioroebe/fasta_and_fastq/show_fasta_statistics.rb +188 -0
- data/lib/bioroebe/fasta_and_fastq/simplify_fasta_header/simplify_fasta_header.rb +111 -0
- data/lib/bioroebe/fasta_and_fastq/split_this_fasta_file_into_chromosomes/constants.rb +26 -0
- data/lib/bioroebe/fasta_and_fastq/split_this_fasta_file_into_chromosomes/menu.rb +41 -0
- data/lib/bioroebe/fasta_and_fastq/split_this_fasta_file_into_chromosomes/misc.rb +23 -0
- data/lib/bioroebe/fasta_and_fastq/split_this_fasta_file_into_chromosomes/reset.rb +68 -0
- data/lib/bioroebe/fasta_and_fastq/split_this_fasta_file_into_chromosomes/split_this_fasta_file_into_chromosomes.rb +290 -0
- data/lib/bioroebe/genbank/README.md +1 -0
- data/lib/bioroebe/genbank/genbank_flat_file_format_generator.rb +275 -0
- data/lib/bioroebe/genbank/genbank_parser.rb +291 -0
- data/lib/bioroebe/gene/gene.rb +64 -0
- data/lib/bioroebe/genomes/genome_pattern.rb +165 -0
- data/lib/bioroebe/genomes/genome_retriever.rb +79 -0
- data/lib/bioroebe/gui/experimental/README.md +1 -0
- data/lib/bioroebe/gui/experimental/snapgene/snapgene.rb +147 -0
- data/lib/bioroebe/gui/gtk3/README.md +2 -0
- data/lib/bioroebe/gui/gtk3/alignment/alignment.rb +337 -0
- data/lib/bioroebe/gui/gtk3/aminoacid_composition/aminoacid_composition.rb +510 -0
- data/lib/bioroebe/gui/gtk3/aminoacid_composition/customized_dialog.rb +55 -0
- data/lib/bioroebe/gui/gtk3/anti_sense_strand/anti_sense_strand.config +6 -0
- data/lib/bioroebe/gui/gtk3/anti_sense_strand/anti_sense_strand.rb +29 -0
- data/lib/bioroebe/gui/gtk3/blosum_matrix_viewer/blosum_matrix_viewer.rb +196 -0
- data/lib/bioroebe/gui/gtk3/calculate_cell_numbers_of_bacteria/calculate_cell_numbers_of_bacteria.config +6 -0
- data/lib/bioroebe/gui/gtk3/calculate_cell_numbers_of_bacteria/calculate_cell_numbers_of_bacteria.rb +106 -0
- data/lib/bioroebe/gui/gtk3/controller/controller.rb +406 -0
- data/lib/bioroebe/gui/gtk3/dna_to_aminoacid_widget/dna_to_aminoacid_widget.rb +609 -0
- data/lib/bioroebe/gui/gtk3/dna_to_reverse_complement_widget/dna_to_reverse_complement_widget.config +6 -0
- data/lib/bioroebe/gui/gtk3/dna_to_reverse_complement_widget/dna_to_reverse_complement_widget.rb +189 -0
- data/lib/bioroebe/gui/gtk3/fasta_table_widget/fasta_table_widget.rb +245 -0
- data/lib/bioroebe/gui/gtk3/format_converter/format_converter.rb +346 -0
- data/lib/bioroebe/gui/gtk3/gene/gene.rb +182 -0
- data/lib/bioroebe/gui/gtk3/hamming_distance/hamming_distance.config +6 -0
- data/lib/bioroebe/gui/gtk3/hamming_distance/hamming_distance.rb +370 -0
- data/lib/bioroebe/gui/gtk3/levensthein_distance/levensthein_distance.config +6 -0
- data/lib/bioroebe/gui/gtk3/levensthein_distance/levensthein_distance.rb +175 -0
- data/lib/bioroebe/gui/gtk3/nucleotide_analyser/nucleotide_analyser.rb +428 -0
- data/lib/bioroebe/gui/gtk3/parse_pdb_file/parse_pdb_file.rb +342 -0
- data/lib/bioroebe/gui/gtk3/primer_design_widget/primer_design_widget.rb +580 -0
- data/lib/bioroebe/gui/gtk3/protein_to_DNA/protein_to_DNA.config +6 -0
- data/lib/bioroebe/gui/gtk3/protein_to_DNA/protein_to_DNA.rb +182 -0
- data/lib/bioroebe/gui/gtk3/random_sequence/random_sequence.rb +566 -0
- data/lib/bioroebe/gui/gtk3/restriction_enzymes/restriction_enzymes.config +6 -0
- data/lib/bioroebe/gui/gtk3/restriction_enzymes/restriction_enzymes.rb +329 -0
- data/lib/bioroebe/gui/gtk3/show_codon_table/misc.rb +556 -0
- data/lib/bioroebe/gui/gtk3/show_codon_table/show_codon_table.rb +171 -0
- data/lib/bioroebe/gui/gtk3/show_codon_usage/show_codon_usage.rb +146 -0
- data/lib/bioroebe/gui/gtk3/sizeseq/sizeseq.rb +207 -0
- data/lib/bioroebe/gui/gtk3/three_to_one/three_to_one.rb +279 -0
- data/lib/bioroebe/gui/gtk3/three_to_one/title.rb +23 -0
- data/lib/bioroebe/gui/gtk3/www_finder/www_finder.config +6 -0
- data/lib/bioroebe/gui/gtk3/www_finder/www_finder.rb +368 -0
- data/lib/bioroebe/gui/jruby/blosum_matrix_viewer/blosum_matrix_viewer.rb +82 -0
- data/lib/bioroebe/gui/libui/README.md +4 -0
- data/lib/bioroebe/gui/libui/alignment/alignment.rb +114 -0
- data/lib/bioroebe/gui/libui/blosum_matrix_viewer/blosum_matrix_viewer.rb +112 -0
- data/lib/bioroebe/gui/libui/calculate_cell_numbers_of_bacteria/calculate_cell_numbers_of_bacteria.rb +60 -0
- data/lib/bioroebe/gui/libui/dna_to_aminoacid_widget/dna_to_aminoacid_widget.rb +161 -0
- data/lib/bioroebe/gui/libui/dna_to_reverse_complement_widget/dna_to_reverse_complement_widget.rb +76 -0
- data/lib/bioroebe/gui/libui/hamming_distance/hamming_distance.rb +135 -0
- data/lib/bioroebe/gui/libui/levensthein_distance/levensthein_distance.rb +118 -0
- data/lib/bioroebe/gui/libui/protein_to_DNA/protein_to_DNA.rb +115 -0
- data/lib/bioroebe/gui/libui/random_sequence/random_sequence.rb +174 -0
- data/lib/bioroebe/gui/libui/show_codon_table/show_codon_table.rb +132 -0
- data/lib/bioroebe/gui/libui/show_codon_usage/show_codon_usage.rb +89 -0
- data/lib/bioroebe/gui/libui/three_to_one/three_to_one.rb +111 -0
- data/lib/bioroebe/gui/shared_code/blosum_matrix_viewer/blosum_matrix_viewer_module.rb +42 -0
- data/lib/bioroebe/gui/shared_code/calculate_cell_numbers_of_bacteria/calculate_cell_numbers_of_bacteria_module.rb +216 -0
- data/lib/bioroebe/gui/shared_code/dna_to_reverse_complement_widget/dna_to_reverse_complement_widget_module.rb +284 -0
- data/lib/bioroebe/gui/shared_code/levensthein_distance/levensthein_distance_module.rb +402 -0
- data/lib/bioroebe/gui/shared_code/protein_to_DNA/protein_to_DNA_module.rb +192 -0
- data/lib/bioroebe/gui/shared_code/show_codon_table/show_codon_table_module.rb +72 -0
- data/lib/bioroebe/gui/shared_code/show_codon_usage/show_codon_usage_module.rb +213 -0
- data/lib/bioroebe/gui/tk/aminoacid_composition/aminoacid_composition.rb +206 -0
- data/lib/bioroebe/gui/tk/blosum_matrix_viewer/blosum_matrix_viewer.rb +140 -0
- data/lib/bioroebe/gui/tk/hamming_distance/hamming_distance.rb +262 -0
- data/lib/bioroebe/gui/tk/levensthein_distance/levensthein_distance.rb +243 -0
- data/lib/bioroebe/gui/tk/three_to_one/three_to_one.rb +199 -0
- data/lib/bioroebe/gui/unified_widgets/anti_sense_strand/anti_sense_strand.rb +519 -0
- data/lib/bioroebe/images/BIOROEBE.png +0 -0
- data/lib/bioroebe/images/BIOROEBE_NEW_LOGO.png +0 -0
- data/lib/bioroebe/images/BlosumMatrixViewer.png +0 -0
- data/lib/bioroebe/images/DnaToAminoacidWidget.png +0 -0
- data/lib/bioroebe/images/PRINTED_AMINOACID_TABLE.png +0 -0
- data/lib/bioroebe/images/class_ConvertAminoacidToDNA.png +0 -0
- data/lib/bioroebe/images/class_SimpleStringComparer.png +0 -0
- data/lib/bioroebe/images/example_of_FASTA_coloured_output.png +0 -0
- data/lib/bioroebe/images/libui_hamming_distance_widget.png +0 -0
- data/lib/bioroebe/images/pretty_DNA_picture.png +0 -0
- data/lib/bioroebe/images/primer_design_widget.png +0 -0
- data/lib/bioroebe/images/restriction_enzyme_commandline_result.png +0 -0
- data/lib/bioroebe/images/ruby-gtk_three_to_one_widget.png +0 -0
- data/lib/bioroebe/images/small_DNA_logo.png +0 -0
- data/lib/bioroebe/images/small_drosophila_image.png +0 -0
- data/lib/bioroebe/java/README.md +6 -0
- data/lib/bioroebe/java/bioroebe/AllInOne.class +0 -0
- data/lib/bioroebe/java/bioroebe/AllInOne.java +214 -0
- data/lib/bioroebe/java/bioroebe/Base.class +0 -0
- data/lib/bioroebe/java/bioroebe/Base.java +102 -0
- data/lib/bioroebe/java/bioroebe/BisulfiteTreatment.class +0 -0
- data/lib/bioroebe/java/bioroebe/BisulfiteTreatment.java +23 -0
- data/lib/bioroebe/java/bioroebe/Cat.class +0 -0
- data/lib/bioroebe/java/bioroebe/Codons.class +0 -0
- data/lib/bioroebe/java/bioroebe/Codons.java +22 -0
- data/lib/bioroebe/java/bioroebe/Esystem.class +0 -0
- data/lib/bioroebe/java/bioroebe/Esystem.java +47 -0
- data/lib/bioroebe/java/bioroebe/GUI/BaseFrame.class +0 -0
- data/lib/bioroebe/java/bioroebe/GUI/BaseFrame.java +65 -0
- data/lib/bioroebe/java/bioroebe/GenerateRandomDnaSequence.class +0 -0
- data/lib/bioroebe/java/bioroebe/GenerateRandomDnaSequence.java +32 -0
- data/lib/bioroebe/java/bioroebe/IsPalindrome.class +0 -0
- data/lib/bioroebe/java/bioroebe/IsPalindrome.java +18 -0
- data/lib/bioroebe/java/bioroebe/PartnerNucleotide.class +0 -0
- data/lib/bioroebe/java/bioroebe/PartnerNucleotide.java +19 -0
- data/lib/bioroebe/java/bioroebe/README.md +4 -0
- data/lib/bioroebe/java/bioroebe/RemoveFile.class +0 -0
- data/lib/bioroebe/java/bioroebe/RemoveFile.java +24 -0
- data/lib/bioroebe/java/bioroebe/RemoveNumbers.class +0 -0
- data/lib/bioroebe/java/bioroebe/RemoveNumbers.java +14 -0
- data/lib/bioroebe/java/bioroebe/SanitizeNucleotideSequence.class +0 -0
- data/lib/bioroebe/java/bioroebe/SanitizeNucleotideSequence.java +20 -0
- data/lib/bioroebe/java/bioroebe/SaveFile.java +44 -0
- data/lib/bioroebe/java/bioroebe/Sequence.java +28 -0
- data/lib/bioroebe/java/bioroebe/ToCamelcase.class +0 -0
- data/lib/bioroebe/java/bioroebe/ToCamelcase.java +32 -0
- data/lib/bioroebe/java/bioroebe/ToplevelMethods.class +0 -0
- data/lib/bioroebe/java/bioroebe/ToplevelMethods.java +15 -0
- data/lib/bioroebe/java/bioroebe/enums/DNA.java +6 -0
- data/lib/bioroebe/java/bioroebe.jar +0 -0
- data/lib/bioroebe/matplotlib/matplotlib_generator.rb +104 -0
- data/lib/bioroebe/misc/quiz/README.md +6 -0
- data/lib/bioroebe/misc/quiz/three_letter_to_aminoacid.rb +163 -0
- data/lib/bioroebe/misc/ruler.rb +244 -0
- data/lib/bioroebe/misc/useful_formulas.rb +129 -0
- data/lib/bioroebe/ncbi/efetch.rb +253 -0
- data/lib/bioroebe/ncbi/ncbi.rb +93 -0
- data/lib/bioroebe/ngs/README.md +2 -0
- data/lib/bioroebe/ngs/phred_quality_score_table.rb +123 -0
- data/lib/bioroebe/nucleotides/complementary_dna_strand.rb +166 -0
- data/lib/bioroebe/nucleotides/molecular_weight_of_nucleotides.rb +135 -0
- data/lib/bioroebe/nucleotides/most_likely_nucleotide_sequence_for_this_aminoacid_sequence.rb +198 -0
- data/lib/bioroebe/nucleotides/sanitize_nucleotide_sequence.rb +133 -0
- data/lib/bioroebe/nucleotides/show_nucleotide_sequence.rb +556 -0
- data/lib/bioroebe/palindromes/palindrome_2D_structure.rb +139 -0
- data/lib/bioroebe/palindromes/palindrome_finder.rb +208 -0
- data/lib/bioroebe/palindromes/palindrome_generator.rb +272 -0
- data/lib/bioroebe/parsers/biolang_parser.rb +156 -0
- data/lib/bioroebe/parsers/blosum_parser.rb +222 -0
- data/lib/bioroebe/parsers/genbank_parser.rb +78 -0
- data/lib/bioroebe/parsers/gff.rb +346 -0
- data/lib/bioroebe/parsers/parse_embl.rb +76 -0
- data/lib/bioroebe/parsers/stride_parser.rb +117 -0
- data/lib/bioroebe/patterns/README.md +5 -0
- data/lib/bioroebe/patterns/analyse_glycosylation_pattern.rb +149 -0
- data/lib/bioroebe/patterns/is_this_sequence_a_EGF2_pattern.rb +66 -0
- data/lib/bioroebe/patterns/profile_pattern.rb +182 -0
- data/lib/bioroebe/patterns/rgg_scanner.rb +160 -0
- data/lib/bioroebe/patterns/scan_for_repeat.rb +157 -0
- data/lib/bioroebe/pdb/download_this_pdb.rb +67 -0
- data/lib/bioroebe/pdb/fetch_fasta_sequence_from_pdb.rb +164 -0
- data/lib/bioroebe/pdb/parse_mmCIF_file.rb +63 -0
- data/lib/bioroebe/pdb/parse_pdb_file.rb +1086 -0
- data/lib/bioroebe/pdb/report_secondary_structures_from_this_pdb_file.rb +225 -0
- data/lib/bioroebe/perl/README.md +7 -0
- data/lib/bioroebe/perl/local_to_global.pl +694 -0
- data/lib/bioroebe/project/project.rb +264 -0
- data/lib/bioroebe/protein_structure/alpha_helix.rb +96 -0
- data/lib/bioroebe/protein_structure/helical_wheel.rb +205 -0
- data/lib/bioroebe/raw_sequence/README.md +17 -0
- data/lib/bioroebe/raw_sequence/raw_sequence.rb +557 -0
- data/lib/bioroebe/readline/README.md +2 -0
- data/lib/bioroebe/readline/readline.rb +31 -0
- data/lib/bioroebe/regexes/README.md +2 -0
- data/lib/bioroebe/regexes/regexes.rb +34 -0
- data/lib/bioroebe/requires/commandline_application.rb +5 -0
- data/lib/bioroebe/requires/require_all_aminoacids_files.rb +28 -0
- data/lib/bioroebe/requires/require_all_calculate_files.rb +26 -0
- data/lib/bioroebe/requires/require_all_codon_files.rb +26 -0
- data/lib/bioroebe/requires/require_all_colour_scheme_files.rb +26 -0
- data/lib/bioroebe/requires/require_all_count_files.rb +26 -0
- data/lib/bioroebe/requires/require_all_dotplot_files.rb +28 -0
- data/lib/bioroebe/requires/require_all_electron_microscopy_files.rb +26 -0
- data/lib/bioroebe/requires/require_all_enzymes_files.rb +28 -0
- data/lib/bioroebe/requires/require_all_fasta_and_fastq_files.rb +32 -0
- data/lib/bioroebe/requires/require_all_nucleotides_files.rb +28 -0
- data/lib/bioroebe/requires/require_all_palindromes_files.rb +29 -0
- data/lib/bioroebe/requires/require_all_parser_files.rb +28 -0
- data/lib/bioroebe/requires/require_all_pattern_files.rb +29 -0
- data/lib/bioroebe/requires/require_all_pdb_files.rb +26 -0
- data/lib/bioroebe/requires/require_all_sequence_files.rb +26 -0
- data/lib/bioroebe/requires/require_all_string_matching_files.rb +28 -0
- data/lib/bioroebe/requires/require_all_svg_files.rb +12 -0
- data/lib/bioroebe/requires/require_all_taxonomy_files.rb +35 -0
- data/lib/bioroebe/requires/require_all_utility_scripts_files.rb +32 -0
- data/lib/bioroebe/requires/require_cleave_and_digest.rb +24 -0
- data/lib/bioroebe/requires/require_colours.rb +20 -0
- data/lib/bioroebe/requires/require_encoding.rb +7 -0
- data/lib/bioroebe/requires/require_sequence.rb +7 -0
- data/lib/bioroebe/requires/require_the_bioroebe_project.rb +162 -0
- data/lib/bioroebe/requires/require_the_bioroebe_shell.rb +7 -0
- data/lib/bioroebe/requires/require_the_bioroebe_sinatra_components.rb +7 -0
- data/lib/bioroebe/requires/require_the_constants.rb +23 -0
- data/lib/bioroebe/requires/require_the_toplevel_methods.rb +29 -0
- data/lib/bioroebe/requires/require_yaml.rb +94 -0
- data/lib/bioroebe/sequence/alignment.rb +214 -0
- data/lib/bioroebe/sequence/dna.rb +211 -0
- data/lib/bioroebe/sequence/nucleotide_module/nucleotide_module.rb +404 -0
- data/lib/bioroebe/sequence/protein.rb +281 -0
- data/lib/bioroebe/sequence/reverse_complement.rb +148 -0
- data/lib/bioroebe/sequence/sequence.rb +706 -0
- data/lib/bioroebe/shell/add.rb +108 -0
- data/lib/bioroebe/shell/assign.rb +360 -0
- data/lib/bioroebe/shell/chop_and_cut.rb +281 -0
- data/lib/bioroebe/shell/colours/colours.rb +235 -0
- data/lib/bioroebe/shell/configuration/additionally_set_xorg_buffer.yml +1 -0
- data/lib/bioroebe/shell/configuration/may_we_show_the_startup_information.yml +1 -0
- data/lib/bioroebe/shell/configuration/upcase_nucleotides.yml +1 -0
- data/lib/bioroebe/shell/configuration/use_silent_startup.yml +1 -0
- data/lib/bioroebe/shell/constants.rb +166 -0
- data/lib/bioroebe/shell/download.rb +335 -0
- data/lib/bioroebe/shell/enable_and_disable.rb +158 -0
- data/lib/bioroebe/shell/enzymes.rb +310 -0
- data/lib/bioroebe/shell/fasta.rb +345 -0
- data/lib/bioroebe/shell/gtk.rb +76 -0
- data/lib/bioroebe/shell/help/class.rb +443 -0
- data/lib/bioroebe/shell/help/help.rb +25 -0
- data/lib/bioroebe/shell/history.rb +132 -0
- data/lib/bioroebe/shell/initialize.rb +217 -0
- data/lib/bioroebe/shell/loop.rb +74 -0
- data/lib/bioroebe/shell/menu.rb +5320 -0
- data/lib/bioroebe/shell/misc.rb +4341 -0
- data/lib/bioroebe/shell/prompt.rb +107 -0
- data/lib/bioroebe/shell/random.rb +289 -0
- data/lib/bioroebe/shell/readline/readline.rb +91 -0
- data/lib/bioroebe/shell/reset.rb +335 -0
- data/lib/bioroebe/shell/scan_and_parse.rb +135 -0
- data/lib/bioroebe/shell/search.rb +337 -0
- data/lib/bioroebe/shell/sequences.rb +200 -0
- data/lib/bioroebe/shell/shell.rb +41 -0
- data/lib/bioroebe/shell/show_report_and_display.rb +2901 -0
- data/lib/bioroebe/shell/startup.rb +127 -0
- data/lib/bioroebe/shell/taxonomy.rb +14 -0
- data/lib/bioroebe/shell/tk.rb +23 -0
- data/lib/bioroebe/shell/user_input.rb +88 -0
- data/lib/bioroebe/shell/xorg.rb +45 -0
- data/lib/bioroebe/siRNA/README.md +2 -0
- data/lib/bioroebe/siRNA/siRNA.rb +93 -0
- data/lib/bioroebe/string_matching/README.md +13 -0
- data/lib/bioroebe/string_matching/find_longest_substring.rb +162 -0
- data/lib/bioroebe/string_matching/find_longest_substring_via_LCS_algorithm.rb +175 -0
- data/lib/bioroebe/string_matching/hamming_distance.rb +313 -0
- data/lib/bioroebe/string_matching/levensthein.rb +698 -0
- data/lib/bioroebe/string_matching/simple_string_comparer.rb +294 -0
- data/lib/bioroebe/string_matching/smith_waterman.rb +276 -0
- data/lib/bioroebe/svg/README.md +1 -0
- data/lib/bioroebe/svg/glyph.rb +719 -0
- data/lib/bioroebe/svg/mini_feature.rb +111 -0
- data/lib/bioroebe/svg/page.rb +570 -0
- data/lib/bioroebe/svg/primitive.rb +70 -0
- data/lib/bioroebe/svg/svgee.rb +326 -0
- data/lib/bioroebe/svg/track.rb +263 -0
- data/lib/bioroebe/taxonomy/README.md +1 -0
- data/lib/bioroebe/taxonomy/chart.rb +95 -0
- data/lib/bioroebe/taxonomy/class_methods.rb +181 -0
- data/lib/bioroebe/taxonomy/colours.rb +26 -0
- data/lib/bioroebe/taxonomy/constants.rb +218 -0
- data/lib/bioroebe/taxonomy/edit.rb +97 -0
- data/lib/bioroebe/taxonomy/help/help.rb +65 -0
- data/lib/bioroebe/taxonomy/help/helpline.rb +53 -0
- data/lib/bioroebe/taxonomy/info/check_available.rb +143 -0
- data/lib/bioroebe/taxonomy/info/info.rb +337 -0
- data/lib/bioroebe/taxonomy/info/is_dna.rb +150 -0
- data/lib/bioroebe/taxonomy/interactive.rb +1933 -0
- data/lib/bioroebe/taxonomy/menu.rb +905 -0
- data/lib/bioroebe/taxonomy/node.rb +118 -0
- data/lib/bioroebe/taxonomy/parse_fasta.rb +383 -0
- data/lib/bioroebe/taxonomy/shared.rb +287 -0
- data/lib/bioroebe/taxonomy/taxonomy.rb +521 -0
- data/lib/bioroebe/toplevel_methods/ad_hoc_task.rb +56 -0
- data/lib/bioroebe/toplevel_methods/aminoacids_and_proteins.rb +715 -0
- data/lib/bioroebe/toplevel_methods/atomic_composition.rb +198 -0
- data/lib/bioroebe/toplevel_methods/base_composition.rb +121 -0
- data/lib/bioroebe/toplevel_methods/blast.rb +153 -0
- data/lib/bioroebe/toplevel_methods/calculate_n50_value.rb +57 -0
- data/lib/bioroebe/toplevel_methods/cat.rb +71 -0
- data/lib/bioroebe/toplevel_methods/chunked_display.rb +92 -0
- data/lib/bioroebe/toplevel_methods/cliner.rb +81 -0
- data/lib/bioroebe/toplevel_methods/complement.rb +58 -0
- data/lib/bioroebe/toplevel_methods/convert_global_env.rb +39 -0
- data/lib/bioroebe/toplevel_methods/databases.rb +73 -0
- data/lib/bioroebe/toplevel_methods/delimiter.rb +19 -0
- data/lib/bioroebe/toplevel_methods/digest.rb +71 -0
- data/lib/bioroebe/toplevel_methods/download_and_fetch_data.rb +146 -0
- data/lib/bioroebe/toplevel_methods/e.rb +20 -0
- data/lib/bioroebe/toplevel_methods/editor.rb +21 -0
- data/lib/bioroebe/toplevel_methods/esystem.rb +22 -0
- data/lib/bioroebe/toplevel_methods/exponential_growth.rb +74 -0
- data/lib/bioroebe/toplevel_methods/extract.rb +56 -0
- data/lib/bioroebe/toplevel_methods/fasta_and_fastq.rb +353 -0
- data/lib/bioroebe/toplevel_methods/file_and_directory_related_actions.rb +257 -0
- data/lib/bioroebe/toplevel_methods/frequencies.rb +92 -0
- data/lib/bioroebe/toplevel_methods/hamming_distance.rb +60 -0
- data/lib/bioroebe/toplevel_methods/infer.rb +66 -0
- data/lib/bioroebe/toplevel_methods/is_on_roebe.rb +39 -0
- data/lib/bioroebe/toplevel_methods/leading_five_prime_and_trailing_three_prime.rb +101 -0
- data/lib/bioroebe/toplevel_methods/levensthein.rb +63 -0
- data/lib/bioroebe/toplevel_methods/log_directory.rb +109 -0
- data/lib/bioroebe/toplevel_methods/longest_common_substring.rb +55 -0
- data/lib/bioroebe/toplevel_methods/map_ncbi_entry_to_eutils_id.rb +88 -0
- data/lib/bioroebe/toplevel_methods/matches.rb +259 -0
- data/lib/bioroebe/toplevel_methods/misc.rb +432 -0
- data/lib/bioroebe/toplevel_methods/nucleotides.rb +715 -0
- data/lib/bioroebe/toplevel_methods/number_of_clones.rb +63 -0
- data/lib/bioroebe/toplevel_methods/open_in_browser.rb +77 -0
- data/lib/bioroebe/toplevel_methods/open_reading_frames.rb +236 -0
- data/lib/bioroebe/toplevel_methods/opn.rb +34 -0
- data/lib/bioroebe/toplevel_methods/palindromes.rb +127 -0
- data/lib/bioroebe/toplevel_methods/parse.rb +59 -0
- data/lib/bioroebe/toplevel_methods/phred_error_probability.rb +68 -0
- data/lib/bioroebe/toplevel_methods/rds.rb +24 -0
- data/lib/bioroebe/toplevel_methods/remove.rb +86 -0
- data/lib/bioroebe/toplevel_methods/return_source_code_of_this_method.rb +35 -0
- data/lib/bioroebe/toplevel_methods/return_subsequence_based_on_indices.rb +68 -0
- data/lib/bioroebe/toplevel_methods/rna_splicing.rb +73 -0
- data/lib/bioroebe/toplevel_methods/rnalfold.rb +69 -0
- data/lib/bioroebe/toplevel_methods/searching_and_finding.rb +116 -0
- data/lib/bioroebe/toplevel_methods/shuffleseq.rb +37 -0
- data/lib/bioroebe/toplevel_methods/statistics.rb +53 -0
- data/lib/bioroebe/toplevel_methods/sum_of_odd_integers.rb +62 -0
- data/lib/bioroebe/toplevel_methods/taxonomy.rb +187 -0
- data/lib/bioroebe/toplevel_methods/three_delimiter.rb +34 -0
- data/lib/bioroebe/toplevel_methods/time_and_date.rb +53 -0
- data/lib/bioroebe/toplevel_methods/to_camelcase.rb +26 -0
- data/lib/bioroebe/toplevel_methods/truncate.rb +48 -0
- data/lib/bioroebe/toplevel_methods/url.rb +36 -0
- data/lib/bioroebe/toplevel_methods/verbose.rb +59 -0
- data/lib/bioroebe/utility_scripts/align_open_reading_frames.rb +191 -0
- data/lib/bioroebe/utility_scripts/analyse_local_dataset.rb +119 -0
- data/lib/bioroebe/utility_scripts/check_for_mismatches/check_for_mismatches.rb +230 -0
- data/lib/bioroebe/utility_scripts/compacter.rb +131 -0
- data/lib/bioroebe/utility_scripts/compseq/compseq.rb +529 -0
- data/lib/bioroebe/utility_scripts/consensus_sequence.rb +374 -0
- data/lib/bioroebe/utility_scripts/create_batch_entrez_file.rb +130 -0
- data/lib/bioroebe/utility_scripts/determine_antigenic_areas.rb +115 -0
- data/lib/bioroebe/utility_scripts/determine_missing_nucleotides_percentage.rb +137 -0
- data/lib/bioroebe/utility_scripts/display_open_reading_frames/determine.rb +73 -0
- data/lib/bioroebe/utility_scripts/display_open_reading_frames/display_open_reading_frames.rb +31 -0
- data/lib/bioroebe/utility_scripts/display_open_reading_frames/initialize.rb +37 -0
- data/lib/bioroebe/utility_scripts/display_open_reading_frames/menu.rb +49 -0
- data/lib/bioroebe/utility_scripts/display_open_reading_frames/misc.rb +471 -0
- data/lib/bioroebe/utility_scripts/display_open_reading_frames/report.rb +113 -0
- data/lib/bioroebe/utility_scripts/display_open_reading_frames/reset.rb +56 -0
- data/lib/bioroebe/utility_scripts/dot_alignment.rb +177 -0
- data/lib/bioroebe/utility_scripts/download_files_from_rebase.rb +72 -0
- data/lib/bioroebe/utility_scripts/find_gene.rb +202 -0
- data/lib/bioroebe/utility_scripts/mirror_repeat.rb +235 -0
- data/lib/bioroebe/utility_scripts/move_file_to_its_correct_location.rb +151 -0
- data/lib/bioroebe/utility_scripts/parse_taxonomy.rb +168 -0
- data/lib/bioroebe/utility_scripts/pathways.rb +152 -0
- data/lib/bioroebe/utility_scripts/permutations.rb +145 -0
- data/lib/bioroebe/utility_scripts/punnet/punnet.rb +126 -0
- data/lib/bioroebe/utility_scripts/show_this_dna_sequence.rb +148 -0
- data/lib/bioroebe/utility_scripts/showorf/constants.rb +36 -0
- data/lib/bioroebe/utility_scripts/showorf/help.rb +33 -0
- data/lib/bioroebe/utility_scripts/showorf/initialize.rb +52 -0
- data/lib/bioroebe/utility_scripts/showorf/menu.rb +68 -0
- data/lib/bioroebe/utility_scripts/showorf/reset.rb +39 -0
- data/lib/bioroebe/utility_scripts/showorf/run.rb +152 -0
- data/lib/bioroebe/utility_scripts/showorf/show.rb +97 -0
- data/lib/bioroebe/utility_scripts/showorf/showorf.rb +488 -0
- data/lib/bioroebe/version/version.rb +44 -0
- data/lib/bioroebe/viennarna/README.md +3 -0
- data/lib/bioroebe/viennarna/rnafold_wrapper.rb +196 -0
- data/lib/bioroebe/with_gui.rb +18 -0
- data/lib/bioroebe/www/bioroebe.cgi +44 -0
- data/lib/bioroebe/www/embeddable_interface.rb +686 -0
- data/lib/bioroebe/www/sinatra/sinatra.rb +1013 -0
- data/lib/bioroebe/yaml/agarose/agarose_concentrations.yml +21 -0
- data/lib/bioroebe/yaml/aminoacids/amino_acids.yml +92 -0
- data/lib/bioroebe/yaml/aminoacids/amino_acids_abbreviations.yml +31 -0
- data/lib/bioroebe/yaml/aminoacids/amino_acids_average_mass_table.yml +33 -0
- data/lib/bioroebe/yaml/aminoacids/amino_acids_classification.yml +18 -0
- data/lib/bioroebe/yaml/aminoacids/amino_acids_english.yml +26 -0
- data/lib/bioroebe/yaml/aminoacids/amino_acids_frequency.yml +44 -0
- data/lib/bioroebe/yaml/aminoacids/amino_acids_long_name_to_one_letter.yml +61 -0
- data/lib/bioroebe/yaml/aminoacids/amino_acids_molecular_formula.yml +32 -0
- data/lib/bioroebe/yaml/aminoacids/amino_acids_monoisotopic_mass_table.yml +38 -0
- data/lib/bioroebe/yaml/aminoacids/amino_acids_reste.yml +35 -0
- data/lib/bioroebe/yaml/aminoacids/amino_acids_three_to_one.yml +34 -0
- data/lib/bioroebe/yaml/aminoacids/hydropathy_table.yml +44 -0
- data/lib/bioroebe/yaml/aminoacids/molecular_weight.yml +29 -0
- data/lib/bioroebe/yaml/aminoacids/simple_aminoacids.yml +66 -0
- data/lib/bioroebe/yaml/aminoacids/weight_of_common_proteins.yml +33 -0
- data/lib/bioroebe/yaml/antisense/antisense.yml +9 -0
- data/lib/bioroebe/yaml/base_composition_of_dna.yml +37 -0
- data/lib/bioroebe/yaml/blosum/blosum45.yml +36 -0
- data/lib/bioroebe/yaml/blosum/blosum50.yml +34 -0
- data/lib/bioroebe/yaml/blosum/blosum62.yml +35 -0
- data/lib/bioroebe/yaml/blosum/blosum80.yml +37 -0
- data/lib/bioroebe/yaml/blosum/blosum90.yml +36 -0
- data/lib/bioroebe/yaml/blosum/blosum_matrix.yml +200 -0
- data/lib/bioroebe/yaml/chromosomes/chromosome_numbers.yml +30 -0
- data/lib/bioroebe/yaml/codon_tables/1.yml +113 -0
- data/lib/bioroebe/yaml/codon_tables/10.yml +89 -0
- data/lib/bioroebe/yaml/codon_tables/11.yml +91 -0
- data/lib/bioroebe/yaml/codon_tables/12.yml +89 -0
- data/lib/bioroebe/yaml/codon_tables/13.yml +89 -0
- data/lib/bioroebe/yaml/codon_tables/14.yml +89 -0
- data/lib/bioroebe/yaml/codon_tables/15.yml +94 -0
- data/lib/bioroebe/yaml/codon_tables/16.yml +89 -0
- data/lib/bioroebe/yaml/codon_tables/2.yml +86 -0
- data/lib/bioroebe/yaml/codon_tables/21.yml +89 -0
- data/lib/bioroebe/yaml/codon_tables/22.yml +89 -0
- data/lib/bioroebe/yaml/codon_tables/23.yml +91 -0
- data/lib/bioroebe/yaml/codon_tables/24.yml +89 -0
- data/lib/bioroebe/yaml/codon_tables/25.yml +89 -0
- data/lib/bioroebe/yaml/codon_tables/26.yml +96 -0
- data/lib/bioroebe/yaml/codon_tables/27.yml +104 -0
- data/lib/bioroebe/yaml/codon_tables/28.yml +97 -0
- data/lib/bioroebe/yaml/codon_tables/29.yml +93 -0
- data/lib/bioroebe/yaml/codon_tables/3.yml +98 -0
- data/lib/bioroebe/yaml/codon_tables/30.yml +91 -0
- data/lib/bioroebe/yaml/codon_tables/31.yml +94 -0
- data/lib/bioroebe/yaml/codon_tables/33.yml +101 -0
- data/lib/bioroebe/yaml/codon_tables/4.yml +96 -0
- data/lib/bioroebe/yaml/codon_tables/5.yml +100 -0
- data/lib/bioroebe/yaml/codon_tables/6.yml +96 -0
- data/lib/bioroebe/yaml/codon_tables/9.yml +97 -0
- data/lib/bioroebe/yaml/codon_tables/overview.yml +42 -0
- data/lib/bioroebe/yaml/configuration/README.md +12 -0
- data/lib/bioroebe/yaml/configuration/browser.yml +1 -0
- data/lib/bioroebe/yaml/configuration/colourize_fasta_sequences.yml +14 -0
- data/lib/bioroebe/yaml/configuration/default_colours_for_the_aminoacids.yml +28 -0
- data/lib/bioroebe/yaml/configuration/temp_dir.yml +1 -0
- data/lib/bioroebe/yaml/configuration/try_to_use_matplotlib.yml +1 -0
- data/lib/bioroebe/yaml/configuration/use_opn.yml +1 -0
- data/lib/bioroebe/yaml/configuration/use_this_database.yml +1 -0
- data/lib/bioroebe/yaml/create_these_directories_on_startup/create_these_directories_on_startup.yml +9 -0
- data/lib/bioroebe/yaml/default_dna_input.yml +3 -0
- data/lib/bioroebe/yaml/enzymes/enzyme_classes.yml +15 -0
- data/lib/bioroebe/yaml/enzymes/pH-Optima.yml +11 -0
- data/lib/bioroebe/yaml/fasta_and_fastq/fastq_quality_schemes.yml +44 -0
- data/lib/bioroebe/yaml/genomes/README.md +16 -0
- data/lib/bioroebe/yaml/humans/README.md +2 -0
- data/lib/bioroebe/yaml/humans/human_chromosomes.yml +53 -0
- data/lib/bioroebe/yaml/laboratory/README.md +1 -0
- data/lib/bioroebe/yaml/laboratory/pipettes.yml +8 -0
- data/lib/bioroebe/yaml/mRNA/mRNA.yml +16 -0
- data/lib/bioroebe/yaml/nuclear_localization_sequences.yml +15 -0
- data/lib/bioroebe/yaml/nucleotides/abbreviations_for_nucleotides.yml +29 -0
- data/lib/bioroebe/yaml/nucleotides/nucleotide_density.yml +10 -0
- data/lib/bioroebe/yaml/nucleotides/nucleotides.yml +34 -0
- data/lib/bioroebe/yaml/nucleotides/nucleotides_weight.yml +12 -0
- data/lib/bioroebe/yaml/pathways/README.md +2 -0
- data/lib/bioroebe/yaml/pathways/citric_acid_cycle.yml +16 -0
- data/lib/bioroebe/yaml/pathways/glycolysis.yml +20 -0
- data/lib/bioroebe/yaml/pathways/shikimate_pathway.yml +23 -0
- data/lib/bioroebe/yaml/pathways/urea_cycle.yml +11 -0
- data/lib/bioroebe/yaml/primers/README.md +4 -0
- data/lib/bioroebe/yaml/primers/primers.yml +3 -0
- data/lib/bioroebe/yaml/promoters/35S.yml +15 -0
- data/lib/bioroebe/yaml/promoters/strong_promoters.yml +24 -0
- data/lib/bioroebe/yaml/proteases/proteases.yml +3 -0
- data/lib/bioroebe/yaml/proteins/ubiquitin.yml +4 -0
- data/lib/bioroebe/yaml/remote_urls/README.md +4 -0
- data/lib/bioroebe/yaml/remote_urls/remote_urls.yml +3 -0
- data/lib/bioroebe/yaml/restriction_enzymes/restriction_enzymes.yml +630 -0
- data/lib/bioroebe/yaml/sequences/JX472995_Green_fluorescent_protein_from_Aequorea_victoria.fasta +14 -0
- data/lib/bioroebe/yaml/sequences/README.md +2 -0
- data/lib/bioroebe/yaml/talens.yml +22 -0
- data/lib/bioroebe/yaml/viruses/ecoli_phages.yml +63 -0
- data/lib/bioroebe/yaml/viruses/viruses.yml +6 -0
- data/lib/bioroebe.rb +5 -0
- data/spec/testing_toplevel_method_editor.rb +20 -0
- data/spec/testing_toplevel_method_url.rb +15 -0
- data/spec/testing_toplevel_method_verbose.rb +13 -0
- data/test/advanced_svg_example.rb +307 -0
- data/test/testing_bioroebe.rb +25 -0
- data/test/testing_codons.rb +45 -0
- data/test/testing_dna_to_rna_conversion.rb +15 -0
- data/test/testing_parse_pdb_file.rb +23 -0
- data/test/testing_reverse_complement.rb +32 -0
- data/test/testing_svg_component_of_bioroebe.rb +311 -0
- data/test/testing_svg_component_of_bioroebe_from_json_dataset.rb +34 -0
- data/test/testing_taxonomy.rb +22 -0
- metadata +1059 -0
@@ -0,0 +1,198 @@
|
|
1
|
+
#!/usr/bin/ruby -w
|
2
|
+
# Encoding: UTF-8
|
3
|
+
# frozen_string_literal: true
|
4
|
+
# =========================================================================== #
|
5
|
+
# require 'bioroebe/toplevel_methods/atomic_composition.rb'
|
6
|
+
# Bioroebe.show_atomic_composition
|
7
|
+
# =========================================================================== #
|
8
|
+
module Bioroebe
|
9
|
+
|
10
|
+
require 'bioroebe/constants/files_and_directories.rb'
|
11
|
+
require 'bioroebe/colours/rev.rb'
|
12
|
+
require 'bioroebe/toplevel_methods/aminoacids_and_proteins.rb'
|
13
|
+
require 'bioroebe/toplevel_methods/e.rb'
|
14
|
+
require 'bioroebe/toplevel_methods/is_on_roebe.rb'
|
15
|
+
|
16
|
+
# ========================================================================= #
|
17
|
+
# === Bioroebe.atomic_composition
|
18
|
+
#
|
19
|
+
# This method will return the composition of atoms in a given protein,
|
20
|
+
# via Hash, such as:
|
21
|
+
#
|
22
|
+
# {"C"=>11, "H"=>19, "N"=>5, "O"=>6, "S"=>0}
|
23
|
+
#
|
24
|
+
# The Hash keeps track of 11 C atoms, 19 H atoms, 5 N atoms,
|
25
|
+
# 6 O atoms and 0 S atoms.
|
26
|
+
#
|
27
|
+
# This hash can then be formatted via the method:
|
28
|
+
#
|
29
|
+
# Bioroebe.show_atomic_composition()
|
30
|
+
#
|
31
|
+
# Which can be found below.
|
32
|
+
#
|
33
|
+
# Presently this method works on aminoacids only, but in theory the
|
34
|
+
# code could be extended to work with DNA nucleotides and RNA
|
35
|
+
# nucleotides as well.
|
36
|
+
#
|
37
|
+
# Either way, the one letter abbreviation should be used as input
|
38
|
+
# to this method.
|
39
|
+
#
|
40
|
+
# When we use aminoacids, we need to remember that a peptide bond
|
41
|
+
# deducts 1x H₂O (water). This will have to be deducted from the
|
42
|
+
# formula, but only if it is an internal aminoacid. In other words,
|
43
|
+
# the only two aminoacids that will behave differently, are the
|
44
|
+
# first one (since it will miss one -OH group) and the last
|
45
|
+
# aminoacid (as this one will lack a -H molecule.
|
46
|
+
#
|
47
|
+
# Remember that the input sequence to this method should be the
|
48
|
+
# one-letter code for the aminoacid sequence at hand.
|
49
|
+
# ========================================================================= #
|
50
|
+
def self.atomic_composition(
|
51
|
+
of = 'GGGGA' # ← This should be the aminoacid sequence.
|
52
|
+
)
|
53
|
+
begin
|
54
|
+
require 'chemistry_paradise/split_molecule_names.rb'
|
55
|
+
require 'chemistry_paradise/toplevel_methods/remove_this_molecule_from.rb'
|
56
|
+
rescue LoadError
|
57
|
+
if is_on_roebe?
|
58
|
+
puts 'Two files from the chemistry_paradise gem are not available.'
|
59
|
+
end
|
60
|
+
end
|
61
|
+
# ======================================================================= #
|
62
|
+
# Load up the molecular formula for each aminoacid next. This will
|
63
|
+
# be used as our reference-point for calculating things such as the
|
64
|
+
# composition, or weight.
|
65
|
+
# ======================================================================= #
|
66
|
+
dataset_molecular_formula_for_the_aminoacids = YAML.load_file(
|
67
|
+
FILE_AMINOACIDS_MOLECULAR_FORMULA
|
68
|
+
)
|
69
|
+
if of.is_a?(Array)
|
70
|
+
if of.empty?
|
71
|
+
of = 'GGGGA' # In this case reinstate the default.
|
72
|
+
else
|
73
|
+
if of.first.is_a?(String) and of.first.size > 1
|
74
|
+
of = of.first.split(//) # Split it on a per-character basis here.
|
75
|
+
end
|
76
|
+
end
|
77
|
+
end
|
78
|
+
if of.is_a? String
|
79
|
+
of = of.split(//)
|
80
|
+
end
|
81
|
+
unless of.is_a? Array
|
82
|
+
of = [of]
|
83
|
+
end
|
84
|
+
hash_keeping_track_of_the_atomic_composition = {}
|
85
|
+
# ======================================================================= #
|
86
|
+
# Build up the default values, for the atoms C, H, N, O and S.
|
87
|
+
# ======================================================================= #
|
88
|
+
hash_keeping_track_of_the_atomic_composition['C'] = 0
|
89
|
+
hash_keeping_track_of_the_atomic_composition['H'] = 0
|
90
|
+
hash_keeping_track_of_the_atomic_composition['N'] = 0
|
91
|
+
hash_keeping_track_of_the_atomic_composition['O'] = 0
|
92
|
+
hash_keeping_track_of_the_atomic_composition['S'] = 0
|
93
|
+
# ======================================================================= #
|
94
|
+
# Next obtain the formula from the ChemistryParadise project. We
|
95
|
+
# do so by iterating over the given input, and we assume that
|
96
|
+
# this input is always an Array.
|
97
|
+
# ======================================================================= #
|
98
|
+
of.map.with_index {|this_amino_acid, position_of_that_aminoacid|
|
99
|
+
# ===================================================================== #
|
100
|
+
# Next, we have to obtain the formula for this amino acid.
|
101
|
+
# ===================================================================== #
|
102
|
+
this_amino_acid = AMINO_ACIDS_ENGLISH[this_amino_acid]
|
103
|
+
formula_for_this_amino_acid = dataset_molecular_formula_for_the_aminoacids[this_amino_acid]
|
104
|
+
# ===================================================================== #
|
105
|
+
# The next case-menu will handle the position of the aminoacid at hand.
|
106
|
+
# We will skip doing so if there is only one aminoacid though.
|
107
|
+
# ===================================================================== #
|
108
|
+
if of.first.to_s.size > 1
|
109
|
+
case position_of_that_aminoacid # case tag
|
110
|
+
when 0 # This is the first aminoacid. It loses only one 'OH' group.
|
111
|
+
formula_for_this_amino_acid =
|
112
|
+
::ChemistryParadise.remove_this_molecule_from('OH', formula_for_this_amino_acid)
|
113
|
+
when (of.size - 1) # This is the last entry. It loses only one 'H' group.
|
114
|
+
formula_for_this_amino_acid =
|
115
|
+
::ChemistryParadise.remove_this_molecule_from('H', formula_for_this_amino_acid)
|
116
|
+
else
|
117
|
+
# ================================================================= #
|
118
|
+
# Else it will lose a full H₂O group.
|
119
|
+
# ================================================================= #
|
120
|
+
formula_for_this_amino_acid =
|
121
|
+
::ChemistryParadise.remove_this_molecule_from('H2O', formula_for_this_amino_acid)
|
122
|
+
end
|
123
|
+
end
|
124
|
+
array_chemical_formula = ::ChemistryParadise.split_this_molecular_formula_into_a_hash(
|
125
|
+
formula_for_this_amino_acid
|
126
|
+
)
|
127
|
+
array_chemical_formula.each {|molecule_and_number| # e. g. 'H13'
|
128
|
+
if molecule_and_number =~ /\d+/ # If it has at the least one number.
|
129
|
+
molecule_and_number =~ /([A-Z]+)(\d{1,2})/ # See: https://rubular.com/r/nCojEDcY6g
|
130
|
+
molecule = $1.to_s.dup
|
131
|
+
n_times = $2.to_s.dup.to_i
|
132
|
+
hash_keeping_track_of_the_atomic_composition[molecule] += n_times
|
133
|
+
else # else it must be 1, since there is no other number, such as 'N'.
|
134
|
+
hash_keeping_track_of_the_atomic_composition[molecule_and_number] += 1
|
135
|
+
end
|
136
|
+
}
|
137
|
+
}
|
138
|
+
return hash_keeping_track_of_the_atomic_composition
|
139
|
+
end
|
140
|
+
|
141
|
+
# ========================================================================= #
|
142
|
+
# === Bioroebe.show_atomic_composition
|
143
|
+
#
|
144
|
+
# This method will output the above.
|
145
|
+
#
|
146
|
+
# Display style is similar to ExPASY output.
|
147
|
+
#
|
148
|
+
# Atomic composition:
|
149
|
+
#
|
150
|
+
# Carbon C 11
|
151
|
+
# Hydrogen H 19
|
152
|
+
# Nitrogen N 5
|
153
|
+
# Oxygen O 6
|
154
|
+
# Sulfur S 0
|
155
|
+
#
|
156
|
+
# ========================================================================= #
|
157
|
+
def self.show_atomic_composition(
|
158
|
+
of = 'GGGGA'
|
159
|
+
)
|
160
|
+
if of.is_a? Array
|
161
|
+
of = of.join(' ').strip
|
162
|
+
end
|
163
|
+
padding_to_use = ' '
|
164
|
+
hash = ::Bioroebe.atomic_composition(of)
|
165
|
+
_ = ''.dup
|
166
|
+
_ << "#{rev}Atomic composition of #{steelblue(of)}#{rev}:\n\n"
|
167
|
+
n_atoms_in_total = hash.values.sum
|
168
|
+
array = %w( C H N O S )
|
169
|
+
array.each {|this_atom|
|
170
|
+
case this_atom
|
171
|
+
when 'C'
|
172
|
+
_ << "#{padding_to_use}#{rev}Carbon C #{hash[this_atom].to_s.rjust(4)}\n"
|
173
|
+
when 'H'
|
174
|
+
_ << "#{padding_to_use}#{rev}Hydrogen H #{hash[this_atom].to_s.rjust(4)}\n"
|
175
|
+
when 'N'
|
176
|
+
_ << "#{padding_to_use}#{rev}Nitrogen N #{hash[this_atom].to_s.rjust(4)}\n"
|
177
|
+
when 'O'
|
178
|
+
_ << "#{padding_to_use}#{rev}Oxygen O #{hash[this_atom].to_s.rjust(4)}\n"
|
179
|
+
when 'S'
|
180
|
+
_ << "#{padding_to_use}#{rev}Sulfur S #{hash[this_atom].to_s.rjust(4)}\n"
|
181
|
+
end
|
182
|
+
}
|
183
|
+
_ << " "+("-" * 18)
|
184
|
+
_ << "\n"
|
185
|
+
_ << " Total: #{n_atoms_in_total}\n\n"
|
186
|
+
puts _
|
187
|
+
end
|
188
|
+
|
189
|
+
end
|
190
|
+
|
191
|
+
if __FILE__ == $PROGRAM_NAME
|
192
|
+
if ARGV.empty?
|
193
|
+
pp Bioroebe.atomic_composition(ARGV)
|
194
|
+
Bioroebe.show_atomic_composition
|
195
|
+
else
|
196
|
+
Bioroebe.show_atomic_composition(ARGV)
|
197
|
+
end
|
198
|
+
end # atomiccomposition GGGGA
|
@@ -0,0 +1,121 @@
|
|
1
|
+
#!/usr/bin/ruby -w
|
2
|
+
# Encoding: UTF-8
|
3
|
+
# frozen_string_literal: true
|
4
|
+
# =========================================================================== #
|
5
|
+
# require 'bioroebe/toplevel_methods/base_composition.rb'
|
6
|
+
# Bioroebe.report_base_composition
|
7
|
+
# =========================================================================== #
|
8
|
+
module Bioroebe
|
9
|
+
|
10
|
+
require 'bioroebe/colours/colours.rb'
|
11
|
+
require 'bioroebe/colours/rev.rb'
|
12
|
+
require 'bioroebe/toplevel_methods/e.rb'
|
13
|
+
|
14
|
+
# ========================================================================= #
|
15
|
+
# === Bioroebe.base_composition
|
16
|
+
#
|
17
|
+
# This method can be used to query the composition of a given DNA
|
18
|
+
# sequence, that is, in percentage, the values for A, T, C and
|
19
|
+
# G.
|
20
|
+
#
|
21
|
+
# This method will then return a Hash, consisting of the percentage
|
22
|
+
# values of A, T, C and G in the given DNA sequence at hand.
|
23
|
+
#
|
24
|
+
# Note that the input to this method has to include a '%' character,
|
25
|
+
# at the least up until March 2020. Past March 2020 this requirement
|
26
|
+
# was dropped, but I still think it is visually more elegant to
|
27
|
+
# include a '%' character.
|
28
|
+
# ========================================================================= #
|
29
|
+
def self.base_composition(
|
30
|
+
i = '52%GC'
|
31
|
+
)
|
32
|
+
if i.is_a? Array
|
33
|
+
if i.empty?
|
34
|
+
i = '52%GC' # Default value.
|
35
|
+
else
|
36
|
+
i = i.join(' ').strip
|
37
|
+
end
|
38
|
+
end
|
39
|
+
# ======================================================================= #
|
40
|
+
# Add support for Files here.
|
41
|
+
# ======================================================================= #
|
42
|
+
if i and File.exist?(i)
|
43
|
+
i = File.readlines(i).reject {|line| line.start_with? '>' }.join("\n").delete("\n")
|
44
|
+
end
|
45
|
+
# ======================================================================= #
|
46
|
+
# We must use a Hash for this.
|
47
|
+
# ======================================================================= #
|
48
|
+
hash = {
|
49
|
+
'A' => 0,
|
50
|
+
'T' => 0,
|
51
|
+
'C' => 0,
|
52
|
+
'G' => 0,
|
53
|
+
}
|
54
|
+
if i.include? '%'
|
55
|
+
splitted = i.split('%').map(&:strip)
|
56
|
+
frequency = splitted.first.to_i
|
57
|
+
opposite_frequency = 100 - frequency
|
58
|
+
characters = splitted.last.split(//)
|
59
|
+
characters.each {|this_nucleotide|
|
60
|
+
hash[this_nucleotide] = frequency / 2
|
61
|
+
}
|
62
|
+
# ===================================================================== #
|
63
|
+
# Next calculate the missing nucleotides:
|
64
|
+
# ===================================================================== #
|
65
|
+
missing_nucleotides = hash.select {|key, value|
|
66
|
+
value == 0
|
67
|
+
}
|
68
|
+
missing_nucleotides.each_pair {|this_nucleotide, value|
|
69
|
+
hash[this_nucleotide] = opposite_frequency / 2
|
70
|
+
}
|
71
|
+
else
|
72
|
+
frequency = Hash.new(0)
|
73
|
+
chars = i.chars
|
74
|
+
chars.each { |entry| frequency[entry] += 1 }
|
75
|
+
sum = frequency.values.sum
|
76
|
+
frequency.each_pair {|this_nucleotide, value|
|
77
|
+
hash[this_nucleotide] = ((value * 100.0) / sum).round(2)
|
78
|
+
}
|
79
|
+
end
|
80
|
+
return hash
|
81
|
+
end; self.instance_eval { alias frequency_of base_composition } # === Bioroebe.frequency_of
|
82
|
+
|
83
|
+
# ========================================================================= #
|
84
|
+
# === Bioroebe.report_base_composition
|
85
|
+
#
|
86
|
+
# This is the convenience-method for reporting the base composition
|
87
|
+
# at hand.
|
88
|
+
# ========================================================================= #
|
89
|
+
def self.report_base_composition(
|
90
|
+
i = '52%GC'
|
91
|
+
)
|
92
|
+
if i.is_a? Array
|
93
|
+
if i.empty?
|
94
|
+
i = '52%GC' # Default value.
|
95
|
+
else
|
96
|
+
i = i.join(' ').strip
|
97
|
+
end
|
98
|
+
end
|
99
|
+
hash = ::Bioroebe.base_composition(i)
|
100
|
+
a = hash['A']
|
101
|
+
t = hash['T']
|
102
|
+
c = hash['C']
|
103
|
+
g = hash['G']
|
104
|
+
erev 'The base composition frequencies of this sequence '\
|
105
|
+
'(length: '+i.size.to_s+') is as follows:'
|
106
|
+
e
|
107
|
+
e ' '\
|
108
|
+
' A: '+steelblue(a.to_s+'%')+rev+
|
109
|
+
' T: '+steelblue(t.to_s+'%')+rev+
|
110
|
+
' C: '+steelblue(c.to_s+'%')+rev+
|
111
|
+
' G: '+steelblue(g.to_s+'%')+rev
|
112
|
+
e
|
113
|
+
end; self.instance_eval { alias show_base_composition report_base_composition } # === show_base_composition
|
114
|
+
|
115
|
+
end
|
116
|
+
|
117
|
+
if __FILE__ == $PROGRAM_NAME
|
118
|
+
pp Bioroebe.base_composition(ARGV)
|
119
|
+
Bioroebe.report_base_composition(ARGV)
|
120
|
+
end # basecomposition ATGC
|
121
|
+
# basecomposition ATTGCCCCCCCCAACCCCACA
|
@@ -0,0 +1,153 @@
|
|
1
|
+
#!/usr/bin/ruby -w
|
2
|
+
# Encoding: UTF-8
|
3
|
+
# frozen_string_literal: true
|
4
|
+
# =========================================================================== #
|
5
|
+
# require 'bioroebe/toplevel_methods/blast.rb'
|
6
|
+
# =========================================================================== #
|
7
|
+
module Bioroebe
|
8
|
+
|
9
|
+
# ========================================================================= #
|
10
|
+
# === Bioroebe.blast_neighborhood
|
11
|
+
#
|
12
|
+
# The second argument to this method is a score-filter, e. g. to
|
13
|
+
# select only entries that have a score higher than 1.
|
14
|
+
# ========================================================================= #
|
15
|
+
def self.blast_neighborhood(
|
16
|
+
this_mer = 'CTC',
|
17
|
+
optional_apply_filter_for_score_higher_than = nil
|
18
|
+
)
|
19
|
+
require 'bioroebe/toplevel_methods/e.rb'
|
20
|
+
if this_mer.is_a? Array
|
21
|
+
this_mer = this_mer.first
|
22
|
+
end
|
23
|
+
if this_mer.nil?
|
24
|
+
this_mer = 'CTC' # Set the same default as above.
|
25
|
+
end
|
26
|
+
match_score = 2
|
27
|
+
mis_match_score = -2
|
28
|
+
# ======================================================================= #
|
29
|
+
# Next use an Array of sequences that we will compare.
|
30
|
+
# ======================================================================= #
|
31
|
+
compare_these_sequences = %w(
|
32
|
+
AAA
|
33
|
+
AAT
|
34
|
+
AAC
|
35
|
+
AAG
|
36
|
+
ATA
|
37
|
+
ATT
|
38
|
+
ATC
|
39
|
+
ATG
|
40
|
+
ACA
|
41
|
+
ACT
|
42
|
+
ACC
|
43
|
+
ACG
|
44
|
+
AGA
|
45
|
+
AGT
|
46
|
+
AGC
|
47
|
+
AGG
|
48
|
+
TAA
|
49
|
+
TAT
|
50
|
+
TAC
|
51
|
+
TAG
|
52
|
+
TTA
|
53
|
+
TTT
|
54
|
+
TTC
|
55
|
+
TTG
|
56
|
+
TCA
|
57
|
+
TCT
|
58
|
+
TCC
|
59
|
+
TCG
|
60
|
+
TGA
|
61
|
+
TGT
|
62
|
+
TGC
|
63
|
+
TGG
|
64
|
+
CAA
|
65
|
+
CAT
|
66
|
+
CAC
|
67
|
+
CAG
|
68
|
+
CTA
|
69
|
+
CTT
|
70
|
+
CTC
|
71
|
+
CTG
|
72
|
+
CCA
|
73
|
+
CCT
|
74
|
+
CCC
|
75
|
+
CCG
|
76
|
+
CGA
|
77
|
+
CGT
|
78
|
+
CGC
|
79
|
+
CGG
|
80
|
+
GAA
|
81
|
+
GAT
|
82
|
+
GAC
|
83
|
+
GAG
|
84
|
+
GTA
|
85
|
+
GTT
|
86
|
+
GTC
|
87
|
+
GTG
|
88
|
+
GCA
|
89
|
+
GCT
|
90
|
+
GCC
|
91
|
+
GCG
|
92
|
+
GGA
|
93
|
+
GGT
|
94
|
+
GGC
|
95
|
+
GGG
|
96
|
+
)
|
97
|
+
compare_these_sequences.each {|this_sequence|
|
98
|
+
score = 0
|
99
|
+
chars = this_sequence.chars
|
100
|
+
first_char = chars[0]
|
101
|
+
second_char = chars[1]
|
102
|
+
third_char = chars[2]
|
103
|
+
if first_char == this_mer[0]
|
104
|
+
# =================================================================== #
|
105
|
+
# Found the first match.
|
106
|
+
# =================================================================== #
|
107
|
+
score += match_score
|
108
|
+
else
|
109
|
+
# =================================================================== #
|
110
|
+
# else it must be a mismatch
|
111
|
+
# =================================================================== #
|
112
|
+
score += mis_match_score
|
113
|
+
end
|
114
|
+
if second_char == this_mer[1]
|
115
|
+
# =================================================================== #
|
116
|
+
# Found the first match.
|
117
|
+
# =================================================================== #
|
118
|
+
score += match_score
|
119
|
+
else
|
120
|
+
# =================================================================== #
|
121
|
+
# else it must be a mismatch
|
122
|
+
# =================================================================== #
|
123
|
+
score += mis_match_score
|
124
|
+
end
|
125
|
+
if third_char == this_mer[2]
|
126
|
+
# =================================================================== #
|
127
|
+
# Found the first match.
|
128
|
+
# =================================================================== #
|
129
|
+
score += match_score
|
130
|
+
else
|
131
|
+
# =================================================================== #
|
132
|
+
# else it must be a mismatch
|
133
|
+
# =================================================================== #
|
134
|
+
score += mis_match_score
|
135
|
+
end
|
136
|
+
if optional_apply_filter_for_score_higher_than
|
137
|
+
if (score.to_i > optional_apply_filter_for_score_higher_than)
|
138
|
+
e "#{this_sequence}: score of "\
|
139
|
+
"#{score.to_s.rjust(3)}"
|
140
|
+
end
|
141
|
+
else
|
142
|
+
e this_sequence+': score of '+
|
143
|
+
score.to_s.rjust(3)
|
144
|
+
end
|
145
|
+
}
|
146
|
+
end
|
147
|
+
|
148
|
+
end
|
149
|
+
|
150
|
+
if __FILE__ == $PROGRAM_NAME
|
151
|
+
# Bioroebe.blast_neighborhood(ARGV)
|
152
|
+
Bioroebe.blast_neighborhood(ARGV, 1)
|
153
|
+
end # rb blast_neighb*
|
@@ -0,0 +1,57 @@
|
|
1
|
+
#!/usr/bin/ruby -w
|
2
|
+
# Encoding: UTF-8
|
3
|
+
# frozen_string_literal: true
|
4
|
+
# =========================================================================== #
|
5
|
+
# require 'bioroebe/toplevel_methods/calculate_n50_value.rb'
|
6
|
+
# Bioroebe.calculate_n50_value(ARGV)
|
7
|
+
# =========================================================================== #
|
8
|
+
module Bioroebe
|
9
|
+
|
10
|
+
# ========================================================================= #
|
11
|
+
# === Bioroebe.calculate_n50_value
|
12
|
+
#
|
13
|
+
# This method will calculate the N50 value of the given input. The input
|
14
|
+
# to this method should be a sorted Array.
|
15
|
+
# ========================================================================= #
|
16
|
+
def self.calculate_n50_value(
|
17
|
+
i = [
|
18
|
+
1989, 1934, 1841,
|
19
|
+
1785, 1737, 1649,
|
20
|
+
1361, 926, 848,
|
21
|
+
723
|
22
|
+
]
|
23
|
+
)
|
24
|
+
# ======================================================================= #
|
25
|
+
# The following conversion is necessary because ARGV will contain only
|
26
|
+
# String objects, not integer-values.
|
27
|
+
# ======================================================================= #
|
28
|
+
i.map! {|entry| entry.to_i }
|
29
|
+
calculate_sum_for_the_loop = 0
|
30
|
+
sum = i.sum
|
31
|
+
half = sum / 2.0
|
32
|
+
find_the_proper_contig = nil
|
33
|
+
i.each {|this_number|
|
34
|
+
calculate_sum_for_the_loop += this_number
|
35
|
+
# ===================================================================== #
|
36
|
+
# Compare the temporary sum with the half-sum.
|
37
|
+
# ===================================================================== #
|
38
|
+
if calculate_sum_for_the_loop > half
|
39
|
+
find_the_proper_contig = this_number
|
40
|
+
break
|
41
|
+
end
|
42
|
+
}
|
43
|
+
return find_the_proper_contig
|
44
|
+
end
|
45
|
+
|
46
|
+
end
|
47
|
+
|
48
|
+
if __FILE__ == $PROGRAM_NAME
|
49
|
+
if ARGV.empty?
|
50
|
+
pp Bioroebe.calculate_n50_value
|
51
|
+
array_to_test = [1252, 919, 917, 765, 711, 690, 632, 516, 463, 218]
|
52
|
+
pp array_to_test
|
53
|
+
pp Bioroebe.calculate_n50_value(array_to_test)
|
54
|
+
else
|
55
|
+
pp Bioroebe.calculate_n50_value(ARGV)
|
56
|
+
end
|
57
|
+
end # calculaten50value
|
@@ -0,0 +1,71 @@
|
|
1
|
+
#!/usr/bin/ruby -w
|
2
|
+
# Encoding: UTF-8
|
3
|
+
# frozen_string_literal: true
|
4
|
+
# =========================================================================== #
|
5
|
+
# require 'bioroebe/toplevel_methods/cat.rb'
|
6
|
+
# =========================================================================== #
|
7
|
+
module Bioroebe
|
8
|
+
|
9
|
+
require 'bioroebe/toplevel_methods/convert_global_env.rb'
|
10
|
+
require 'bioroebe/toplevel_methods/e.rb'
|
11
|
+
require 'bioroebe/colours/colours.rb'
|
12
|
+
require 'bioroebe/colours/rev.rb'
|
13
|
+
require 'bioroebe/colours/sfile.rb'
|
14
|
+
require 'bioroebe/colours/sdir.rb'
|
15
|
+
|
16
|
+
# ========================================================================= #
|
17
|
+
# === Bioroebe.cat (cat tag)
|
18
|
+
#
|
19
|
+
# A variant of cat to use here.
|
20
|
+
# ========================================================================= #
|
21
|
+
def self.cat(i = nil)
|
22
|
+
if i
|
23
|
+
i = convert_global_env(i) if i.include? '$'
|
24
|
+
i = Dir['*'][i.to_i - 1] if i =~ /^\d+$/
|
25
|
+
end
|
26
|
+
if i.nil?
|
27
|
+
erev 'Please provide an argument to Bioroebe.cat() (the name of a file)'
|
28
|
+
# ======================================================================= #
|
29
|
+
# === Handle directories next
|
30
|
+
# ======================================================================= #
|
31
|
+
elsif File.directory? i
|
32
|
+
erev "We can not read from `#{sdir(i)}#{rev}` as it is a directory."
|
33
|
+
# ======================================================================= #
|
34
|
+
# Else the File will exist in this clause:
|
35
|
+
# ======================================================================= #
|
36
|
+
elsif File.exist?(i)
|
37
|
+
_ = File.extname(i).delete('.')
|
38
|
+
case _ # case tag
|
39
|
+
# ===================================================================== #
|
40
|
+
# === fasta
|
41
|
+
# ===================================================================== #
|
42
|
+
when 'fasta',
|
43
|
+
'fa'
|
44
|
+
e 'This is a fasta file, so rather than cat-ing the content,'
|
45
|
+
e 'we will send this dataset to the ParseFasta class.'
|
46
|
+
require 'bioroebe/fasta_and_fastq/parse_fasta/parse_fasta.rb'
|
47
|
+
Bioroebe::ParseFasta.new(i)
|
48
|
+
else # The default here.
|
49
|
+
e "Now displaying the file `#{sfile(i)}`."
|
50
|
+
# e File.read(i)
|
51
|
+
# ^^^ Or we could use the above. We have to reconsider this one day.
|
52
|
+
File.readlines(i).each {|line| e " #{line.chomp}" } # With a bit of padding.
|
53
|
+
end
|
54
|
+
else # else the file does not exist.
|
55
|
+
e "#{swarn('Trying to display the file `')}#{sfile(i)}#{swarn('`')}"
|
56
|
+
e swarn('but it does not exist.')
|
57
|
+
end
|
58
|
+
end
|
59
|
+
|
60
|
+
# ========================================================================= #
|
61
|
+
# === cat
|
62
|
+
# ========================================================================= #
|
63
|
+
def cat(i)
|
64
|
+
::Bioroebe.cat(i)
|
65
|
+
end
|
66
|
+
|
67
|
+
end
|
68
|
+
|
69
|
+
if __FILE__ == $PROGRAM_NAME
|
70
|
+
Bioroebe.cat '/etc/wgetrc' # This is just for testing purposes really.
|
71
|
+
end # bioroebe_cat
|
@@ -0,0 +1,92 @@
|
|
1
|
+
#!/usr/bin/ruby -w
|
2
|
+
# Encoding: UTF-8
|
3
|
+
# frozen_string_literal: true
|
4
|
+
# =========================================================================== #
|
5
|
+
# This code will return a properly-chunked nucleotide sequence, with
|
6
|
+
# numbers.
|
7
|
+
#
|
8
|
+
# The genbank format uses such a chunked display.
|
9
|
+
#
|
10
|
+
# The display will look similar to this:
|
11
|
+
#
|
12
|
+
#
|
13
|
+
# 1 ATGGGGCCTG CAATGGGGCC TGCAATGGGG CCTGCAATGG GGCCTGCAAT GGGGCCTGCA
|
14
|
+
# 61 ATGGGGCCTG CAATGGGGCC TGCAATGGGG CCTGCA
|
15
|
+
#
|
16
|
+
#
|
17
|
+
# The chunks width defaults to the genbank format.
|
18
|
+
# =========================================================================== #
|
19
|
+
# require 'bioroebe/toplevel_methods/chunked_display.rb'
|
20
|
+
# puts Bioroebe.chunked_display(ARGV, 10)
|
21
|
+
# =========================================================================== #
|
22
|
+
module Bioroebe
|
23
|
+
|
24
|
+
require 'bioroebe/constants/newline.rb'
|
25
|
+
|
26
|
+
# ========================================================================= #
|
27
|
+
# === Bioroebe.return_nucleotide_sequence_as_ten_nucleotides_chunks
|
28
|
+
# ========================================================================= #
|
29
|
+
def self.return_nucleotide_sequence_as_ten_nucleotides_chunks(i)
|
30
|
+
i.split(/(.{10})/).reject(&:empty?)
|
31
|
+
end
|
32
|
+
|
33
|
+
# ========================================================================= #
|
34
|
+
# === Bioroebe.return_chunked_display
|
35
|
+
#
|
36
|
+
# The second argument to this method tells us how many nucleotides
|
37
|
+
# shall be grouped together (and then displayed as such).
|
38
|
+
# ========================================================================= #
|
39
|
+
def self.return_chunked_display(
|
40
|
+
i,
|
41
|
+
group_together_n_nucleotides = 10
|
42
|
+
)
|
43
|
+
i = i.first if i.is_a? Array
|
44
|
+
chunks = i.split(/(.{#{group_together_n_nucleotides}})/).reject(&:empty?)
|
45
|
+
sliced = chunks.each_slice(6).to_a
|
46
|
+
_ = ''.dup # We need a dynamic String.
|
47
|
+
sliced.each {|array|
|
48
|
+
# ===================================================================== #
|
49
|
+
# First, add the number to the beginning.
|
50
|
+
# ===================================================================== #
|
51
|
+
nucleotide_position = (
|
52
|
+
_.strip.tr(' ','').tr(N,'').gsub(/\d/,'').strip.size + 1
|
53
|
+
).to_s
|
54
|
+
_ << nucleotide_position.rjust(9)+' '
|
55
|
+
_ << array.join(' ')
|
56
|
+
_ << N
|
57
|
+
}
|
58
|
+
return _
|
59
|
+
end; self.instance_eval { alias chunked_display return_chunked_display } # === Bioroebe.chunked_display
|
60
|
+
|
61
|
+
# ========================================================================= #
|
62
|
+
# === Bioroebe.downcase_chunked_display
|
63
|
+
#
|
64
|
+
# This is similar to the regular chunked display, but will return
|
65
|
+
# the nucleotides in a downcased manner, aka "A" will become "a"
|
66
|
+
# and so forth.
|
67
|
+
#
|
68
|
+
# In the past this functionality resided in its own .rb file, but
|
69
|
+
# since as of March 2020 a bin/ executable was added, so that
|
70
|
+
# the functionality can be more easily called when the bioroebe
|
71
|
+
# gem is installed.
|
72
|
+
#
|
73
|
+
# Usage example:
|
74
|
+
#
|
75
|
+
# Bioroebe.downcase_chunked_display 'ATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCA'
|
76
|
+
#
|
77
|
+
# ========================================================================= #
|
78
|
+
def self.downcase_chunked_display(
|
79
|
+
i,
|
80
|
+
group_together_n_nucleotides = 10
|
81
|
+
)
|
82
|
+
sequence = ::Bioroebe.return_chunked_display(i, group_together_n_nucleotides).downcase
|
83
|
+
return sequence
|
84
|
+
end
|
85
|
+
|
86
|
+
end
|
87
|
+
|
88
|
+
if __FILE__ == $PROGRAM_NAME
|
89
|
+
puts Bioroebe.chunked_display(ARGV, 10)
|
90
|
+
puts Bioroebe.downcase_chunked_display(ARGV, 10)
|
91
|
+
end # chunkeddisplay ATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCA
|
92
|
+
# downcasechunkeddisplay ATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCAATGGGGCCTGCA
|