bioroebe 0.12.24 → 0.13.31
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/LICENSE.md +7 -8
- data/README.md +566 -354
- data/bin/all_positions_of_this_nucleotide +1 -1
- data/bin/aminoacid_frequencies +1 -1
- data/bin/automatically_rename_this_fasta_file +1 -1
- data/bin/base_composition +1 -1
- data/bin/batch_create_windows_executables +1 -1
- data/bin/bioroebe +12 -1
- data/bin/bioroebe_cat +7 -0
- data/bin/calculate_exponential_growth +7 -0
- data/bin/calculate_n50_value +1 -1
- data/bin/calculate_the_frequencies_of_this_species +7 -0
- data/bin/chunked_display +1 -1
- data/bin/codon_frequency +1 -1
- data/bin/codon_to_aminoacid +1 -1
- data/bin/colourize_this_fasta_sequence +1 -1
- data/bin/complementary_dna_strand +1 -1
- data/bin/complementary_rna_strand +1 -1
- data/bin/consensus_sequence +1 -1
- data/bin/dna_to_rna +1 -1
- data/bin/downcase_chunked_display +1 -1
- data/bin/download_this_pdb +1 -1
- data/bin/fasta_index +1 -1
- data/bin/fetch_data_from_uniprot +1 -1
- data/bin/filter_away_invalid_nucleotides +1 -1
- data/bin/find_substring +1 -1
- data/bin/input_as_dna +1 -1
- data/bin/is_palindrome +1 -1
- data/bin/leading_five_prime +1 -1
- data/bin/longest_ORF +1 -1
- data/bin/longest_substring +1 -1
- data/bin/open_reading_frames +1 -1
- data/bin/partner_nucleotide +1 -1
- data/bin/plain_palindrome +1 -1
- data/bin/random_dna_sequence +1 -1
- data/bin/random_sequence +1 -1
- data/bin/raw_hamming_distance +1 -1
- data/bin/return_longest_substring_via_LCS_algorithm +1 -1
- data/bin/reverse_sequence +1 -1
- data/bin/short_aminoacid_letter_from_long_aminoacid_name +1 -1
- data/bin/show_atomic_composition +1 -1
- data/bin/show_fasta_header +1 -1
- data/bin/show_nucleotide_sequence +1 -1
- data/bin/show_this_dna_sequence +1 -1
- data/bin/show_time_now +7 -0
- data/bin/sort_aminoacid_based_on_its_hydrophobicity +1 -1
- data/bin/strict_filter_away_invalid_aminoacids +1 -1
- data/{lib/bioroebe/base/reset.rb → bin/three_delimiter} +9 -6
- data/bin/three_to_one +1 -1
- data/bin/to_rna +1 -1
- data/bin/trailing_three_prime +1 -1
- data/bin/upcase_this_aminoacid_sequence_and_remove_numbers +1 -1
- data/bioroebe.gemspec +6 -7
- data/doc/README.gen +534 -322
- data/doc/blosum/blosum.md +4 -0
- data/doc/compatibility/BIO_PHP.md +20 -18
- data/doc/compatibility/README.md +2 -3
- data/doc/compatibility/emboss.md +5 -3
- data/doc/{extensive_usage_example.md → extensive_usage_example/extensive_usage_example.md} +4 -2
- data/doc/{instructions_for_the_taxonomy_subproject.md → instructions_for_the_taxonomy_subproject/instructions_for_the_taxonomy_subproject.md} +36 -33
- data/doc/{legacy_paths.md → legacy_paths/legacy_paths.md} +3 -3
- data/doc/statistics/statistics.md +12 -10
- data/doc/todo/bioroebe_GUI_todo.md +6 -1
- data/doc/todo/bioroebe_java_todo.md +3 -2
- data/doc/todo/bioroebe_todo.md +328 -310
- data/doc/{using_biomart.md → using_biomart/using_biomart.md} +7 -3
- data/lib/bioroebe/abstract/features.rb +0 -0
- data/lib/bioroebe/aminoacids/aminoacid_substitution.rb +1 -1
- data/lib/bioroebe/aminoacids/aminoacids_mass_table.rb +3 -1
- data/lib/bioroebe/aminoacids/codon_percentage.rb +18 -10
- data/lib/bioroebe/aminoacids/create_random_aminoacids.rb +5 -2
- data/lib/bioroebe/aminoacids/deduce_aminoacid_sequence.rb +90 -64
- data/lib/bioroebe/aminoacids/display_aminoacid_table.rb +1 -3
- data/lib/bioroebe/aminoacids/show_hydrophobicity.rb +2 -2
- data/lib/bioroebe/annotations/create_annotation_format.rb +2 -2
- data/lib/bioroebe/base/base.rb +101 -6
- data/lib/bioroebe/base/base_module/base_module.rb +9 -1
- data/lib/bioroebe/base/colours.rb +3 -0
- data/lib/bioroebe/base/colours_for_base/colours_for_base.rb +80 -44
- data/lib/bioroebe/base/commandline_application/README.md +1 -1
- data/lib/bioroebe/base/commandline_application/commandline_application.rb +661 -22
- data/lib/bioroebe/base/commandline_application/commandline_arguments.rb +2 -1
- data/lib/bioroebe/base/infer_the_namespace_module/infer_the_namespace_module.rb +37 -0
- data/lib/bioroebe/base/internal_hash_module/internal_hash_module.rb +1 -6
- data/lib/bioroebe/base/prototype/prototype.rb +155 -14
- data/lib/bioroebe/biomart/attribute.rb +1 -1
- data/lib/bioroebe/biomart/biomart.rb +8 -9
- data/lib/bioroebe/biomart/server.rb +1 -1
- data/lib/bioroebe/blosum/blosum.rb +2 -2
- data/lib/bioroebe/calculate/calculate_blosum_score.rb +5 -3
- data/lib/bioroebe/calculate/calculate_gc_content.rb +1 -1
- data/lib/bioroebe/calculate/calculate_levensthein_distance.rb +5 -3
- data/lib/bioroebe/calculate/calculate_melting_temperature.rb +2 -10
- data/lib/bioroebe/calculate/calculate_melting_temperature_for_more_than_thirteen_nucleotides.rb +6 -15
- data/lib/bioroebe/calculate/calculate_the_position_specific_scoring_matrix.rb +4 -2
- data/lib/bioroebe/cell/cell.rb +3 -2
- data/lib/bioroebe/cell/specialized_cells/B_cell.rb +60 -0
- data/lib/bioroebe/cell/specialized_cells/Macrophage.rb +60 -0
- data/lib/bioroebe/cell/specialized_cells/README.md +5 -0
- data/lib/bioroebe/cell/specialized_cells/T_cell.rb +60 -0
- data/lib/bioroebe/cleave_and_digest/cleave.rb +3 -1
- data/lib/bioroebe/cleave_and_digest/digestion.rb +1 -1
- data/lib/bioroebe/codon_tables/frequencies/10090_Mus_musculus.yml +93 -0
- data/lib/bioroebe/codon_tables/frequencies/107243_Thlaspi_caerulescens.yml +72 -0
- data/lib/bioroebe/codon_tables/frequencies/parse_frequency_table.rb +2 -2
- data/lib/bioroebe/codons/codon_table.rb +10 -2
- data/lib/bioroebe/codons/codons.rb +3 -3
- data/lib/bioroebe/codons/convert_this_codon_to_that_aminoacid.rb +18 -15
- data/lib/bioroebe/codons/determine_optimal_codons.rb +1 -1
- data/lib/bioroebe/codons/possible_codons_for_this_aminoacid.rb +4 -2
- data/lib/bioroebe/codons/show_codon_tables.rb +1 -1
- data/lib/bioroebe/codons/show_codon_usage.rb +1 -2
- data/lib/bioroebe/codons/show_this_codon_table.rb +2 -2
- data/lib/bioroebe/codons/start_codons.rb +7 -3
- data/lib/bioroebe/colours/colour_schemes/README.md +1 -1
- data/lib/bioroebe/colours/colour_schemes/array_available_colour_schemes.rb +3 -3
- data/lib/bioroebe/colours/colour_schemes/colour_scheme.rb +3 -3
- data/lib/bioroebe/colours/colour_schemes/colour_scheme_demo.rb +4 -3
- data/lib/bioroebe/colours/colour_schemes/helix.rb +3 -1
- data/lib/bioroebe/colours/colour_schemes/hydropathy.rb +3 -1
- data/lib/bioroebe/colours/colour_schemes/score.rb +13 -2
- data/lib/bioroebe/colours/colour_schemes/strand.rb +3 -1
- data/lib/bioroebe/colours/colour_schemes/turn.rb +3 -1
- data/lib/bioroebe/colours/colour_schemes/zappo.rb +1 -1
- data/lib/bioroebe/{toplevel_methods/colourize_related_methods.rb → colours/colourize_related_code.rb} +1 -3
- data/lib/bioroebe/colours/colourize_sequence.rb +3 -1
- data/lib/bioroebe/colours/colours.rb +172 -15
- data/lib/bioroebe/configuration/configuration.rb +1 -1
- data/lib/bioroebe/constants/GUIs.rb +2 -2
- data/lib/bioroebe/constants/constants.rb +1349 -0
- data/lib/bioroebe/conversions/convert_aminoacid_to_dna.rb +8 -13
- data/lib/bioroebe/conversions/dna_to_aminoacid_sequence.rb +9 -3
- data/lib/bioroebe/count/count_amount_of_aminoacids.rb +11 -10
- data/lib/bioroebe/count/count_amount_of_nucleotides.rb +1 -1
- data/lib/bioroebe/count/count_at.rb +2 -1
- data/lib/bioroebe/databases/download_taxonomy_database.rb +1 -1
- data/lib/bioroebe/dotplots/advanced_dotplot.rb +2 -2
- data/lib/bioroebe/electron_microscopy/coordinate_analyzer.rb +2 -2
- data/lib/bioroebe/electron_microscopy/fix_pos_file.rb +2 -2
- data/lib/bioroebe/electron_microscopy/flipy.rb +2 -2
- data/lib/bioroebe/electron_microscopy/generate_em2em_file.rb +3 -11
- data/lib/bioroebe/electron_microscopy/parse_coordinates.rb +6 -6
- data/lib/bioroebe/electron_microscopy/read_file_xmd.rb +6 -6
- data/lib/bioroebe/electron_microscopy/simple_star_file_generator.rb +2 -2
- data/lib/bioroebe/enzymes/has_this_restriction_enzyme.rb +1 -1
- data/lib/bioroebe/enzymes/restriction_enzyme.rb +1 -1
- data/lib/bioroebe/enzymes/restriction_enzymes/statistics.rb +4 -3
- data/lib/bioroebe/enzymes/restriction_enzymes_file.rb +1 -1
- data/lib/bioroebe/enzymes/return_sequence_that_is_cut_via_restriction_enzyme.rb +4 -3
- data/lib/bioroebe/enzymes/show_restriction_enzymes.rb +3 -3
- data/lib/bioroebe/ext/main.cpp +0 -1
- data/lib/bioroebe/fasta_and_fastq/autocorrect_the_name_of_this_fasta_file.rb +3 -3
- data/lib/bioroebe/fasta_and_fastq/compact_fasta_file/compact_fasta_file.rb +1 -1
- data/lib/bioroebe/fasta_and_fastq/display_how_many_fasta_entries_are_in_this_directory.rb +1 -1
- data/lib/bioroebe/fasta_and_fastq/download_fasta.rb +8 -14
- data/lib/bioroebe/fasta_and_fastq/fasta_defline/fasta_defline.rb +1 -1
- data/lib/bioroebe/fasta_and_fastq/fasta_to_yaml/fasta_to_yaml.rb +1 -1
- data/lib/bioroebe/fasta_and_fastq/fastq_format_explainer.rb +1 -1
- data/lib/bioroebe/fasta_and_fastq/length_modifier/length_modifier.rb +1 -1
- data/lib/bioroebe/fasta_and_fastq/parse_fasta/parse_fasta.rb +37 -11
- data/lib/bioroebe/fasta_and_fastq/parse_fastq/parse_fastq.rb +2 -2
- data/lib/bioroebe/fasta_and_fastq/return_fasta_subsection_of_this_file.rb +1 -1
- data/lib/bioroebe/fasta_and_fastq/show_fasta_headers.rb +5 -13
- data/lib/bioroebe/fasta_and_fastq/show_fasta_statistics.rb +1 -1
- data/lib/bioroebe/fasta_and_fastq/simplify_fasta_header/simplify_fasta_header.rb +1 -1
- data/lib/bioroebe/fasta_and_fastq/split_this_fasta_file_into_chromosomes/reset.rb +3 -6
- data/lib/bioroebe/fasta_and_fastq/split_this_fasta_file_into_chromosomes/split_this_fasta_file_into_chromosomes.rb +3 -3
- data/lib/bioroebe/genbank/genbank_flat_file_format_generator.rb +20 -11
- data/lib/bioroebe/genome/genome.rb +1 -1
- data/lib/bioroebe/genomes/genome_pattern.rb +17 -16
- data/lib/bioroebe/genomes/genome_retriever.rb +4 -2
- data/lib/bioroebe/gui/experimental/snapgene/snapgene.rb +10 -13
- data/lib/bioroebe/gui/universal_widgets/alignment/alignment.rb +557 -0
- data/lib/bioroebe/gui/{gtk3 → universal_widgets}/aminoacid_composition/aminoacid_composition.rb +498 -198
- data/lib/bioroebe/gui/universal_widgets/anti_sense_strand/anti_sense_strand.rb +665 -0
- data/lib/bioroebe/gui/universal_widgets/blosum_matrix_viewer/blosum_matrix_viewer.rb +329 -0
- data/lib/bioroebe/gui/universal_widgets/calculate_cell_numbers_of_bacteria/calculate_cell_numbers_of_bacteria.rb +423 -0
- data/lib/bioroebe/gui/{gtk3 → universal_widgets}/controller/controller.rb +170 -118
- data/lib/bioroebe/gui/{gtk3 → universal_widgets}/dna_to_aminoacid_widget/dna_to_aminoacid_widget.rb +277 -215
- data/lib/bioroebe/gui/{shared_code/dna_to_reverse_complement_widget/dna_to_reverse_complement_widget_module.rb → universal_widgets/dna_to_reverse_complement_widget/dna_to_reverse_complement_widget.rb} +297 -107
- data/lib/bioroebe/gui/universal_widgets/fasta_table_widget/fasta_table_widget.rb +643 -0
- data/lib/bioroebe/gui/{gtk3 → universal_widgets}/format_converter/format_converter.rb +236 -164
- data/lib/bioroebe/gui/universal_widgets/gene/gene.rb +278 -0
- data/lib/bioroebe/gui/universal_widgets/hamming_distance/hamming_distance.rb +646 -0
- data/lib/bioroebe/gui/{shared_code/levensthein_distance/levensthein_distance_module.rb → universal_widgets/levensthein_distance/levensthein_distance.rb} +313 -88
- data/lib/bioroebe/gui/{gtk3 → universal_widgets}/nucleotide_analyser/nucleotide_analyser.rb +281 -189
- data/lib/bioroebe/gui/{gtk3 → universal_widgets}/parse_pdb_file/parse_pdb_file.rb +265 -149
- data/lib/bioroebe/gui/{gtk3 → universal_widgets}/primer_design_widget/primer_design_widget.rb +337 -263
- data/lib/bioroebe/gui/universal_widgets/protein_to_DNA/protein_to_DNA.rb +408 -0
- data/lib/bioroebe/gui/{gtk3 → universal_widgets}/random_sequence/random_sequence.rb +245 -187
- data/lib/bioroebe/gui/{gtk3 → universal_widgets}/restriction_enzymes/restriction_enzymes.rb +207 -137
- data/lib/bioroebe/gui/universal_widgets/shell/shell.rb +288 -0
- data/lib/bioroebe/gui/{gtk3/show_codon_table/misc.rb → universal_widgets/show_codon_table/show_codon_table.rb} +290 -110
- data/lib/bioroebe/gui/{shared_code/show_codon_usage/show_codon_usage_module.rb → universal_widgets/show_codon_usage/show_codon_usage.rb} +228 -47
- data/lib/bioroebe/gui/{gtk3 → universal_widgets}/sizeseq/sizeseq.rb +151 -69
- data/lib/bioroebe/gui/{gtk3 → universal_widgets}/three_to_one/three_to_one.rb +190 -127
- data/lib/bioroebe/gui/{gtk3 → universal_widgets}/www_finder/www_finder.rb +211 -152
- data/lib/bioroebe/images/images.html +953 -1170
- data/lib/bioroebe/images/misc/README.md +6 -0
- data/lib/bioroebe/images/misc/activation.avif +0 -0
- data/lib/bioroebe/images/misc/inhibition.avif +0 -0
- data/lib/bioroebe/images/misc/small_virus_logo.avif +0 -0
- data/lib/bioroebe/{constants/base_directory.rb → log_directory/log_directory.rb} +79 -59
- data/lib/bioroebe/matplotlib/matplotlib_generator.rb +1 -1
- data/lib/bioroebe/misc/quiz/three_letter_to_aminoacid.rb +1 -1
- data/lib/bioroebe/misc/ruler.rb +5 -5
- data/lib/bioroebe/misc/useful_formulas.rb +3 -3
- data/lib/bioroebe/ncbi/efetch.rb +1 -2
- data/lib/bioroebe/ngs/phred_quality_score_table.rb +3 -3
- data/lib/bioroebe/nucleotides/complementary_dna_strand.rb +3 -6
- data/lib/bioroebe/nucleotides/molecular_weight_of_nucleotides.rb +3 -3
- data/lib/bioroebe/nucleotides/most_likely_nucleotide_sequence_for_this_aminoacid_sequence.rb +6 -10
- data/lib/bioroebe/nucleotides/{show_nucleotide_sequence.rb → show_nucleotide_sequence/show_nucleotide_sequence.rb} +377 -255
- data/lib/bioroebe/palindromes/palindrome_2D_structure.rb +1 -1
- data/lib/bioroebe/palindromes/palindrome_finder.rb +1 -1
- data/lib/bioroebe/palindromes/palindrome_generator.rb +2 -10
- data/lib/bioroebe/parsers/biolang_parser.rb +1 -1
- data/lib/bioroebe/parsers/blosum_parser.rb +14 -19
- data/lib/bioroebe/parsers/genbank_parser.rb +2 -6
- data/lib/bioroebe/parsers/gff.rb +9 -9
- data/lib/bioroebe/parsers/parse_embl.rb +2 -6
- data/lib/bioroebe/parsers/stride_parser.rb +4 -12
- data/lib/bioroebe/patterns/analyse_glycosylation_pattern.rb +2 -2
- data/lib/bioroebe/patterns/is_this_sequence_a_EGF2_pattern.rb +6 -3
- data/lib/bioroebe/patterns/profile_pattern.rb +2 -2
- data/lib/bioroebe/patterns/rgg_scanner.rb +4 -2
- data/lib/bioroebe/{protein_structure → pdb_and_protein_structure}/alpha_helix.rb +2 -2
- data/lib/bioroebe/{pdb → pdb_and_protein_structure}/download_this_pdb.rb +2 -3
- data/lib/bioroebe/{pdb → pdb_and_protein_structure}/fetch_fasta_sequence_from_pdb.rb +4 -4
- data/lib/bioroebe/{protein_structure → pdb_and_protein_structure}/helical_wheel.rb +2 -2
- data/lib/bioroebe/{pdb → pdb_and_protein_structure}/parse_mmCIF_file.rb +1 -1
- data/lib/bioroebe/{pdb → pdb_and_protein_structure}/parse_pdb_file.rb +3 -3
- data/lib/bioroebe/{pdb → pdb_and_protein_structure}/report_secondary_structures_from_this_pdb_file.rb +3 -3
- data/lib/bioroebe/project/project.rb +3 -1
- data/lib/bioroebe/raw_sequence/README.md +8 -8
- data/lib/bioroebe/raw_sequence/raw_sequence.rb +11 -2
- data/lib/bioroebe/regexes/regexes.rb +1 -2
- data/lib/bioroebe/requires/commandline_application.rb +3 -1
- data/lib/bioroebe/requires/require_all_pdb_files.rb +1 -1
- data/lib/bioroebe/requires/require_all_taxonomy_files.rb +1 -1
- data/lib/bioroebe/requires/require_all_utility_scripts_files.rb +10 -0
- data/lib/bioroebe/requires/require_colours.rb +1 -1
- data/lib/bioroebe/requires/require_the_bioroebe_project.rb +5 -7
- data/lib/bioroebe/requires/require_the_bioroebe_sinatra_components.rb +1 -1
- data/lib/bioroebe/requires/require_the_constants.rb +2 -14
- data/lib/bioroebe/requires/require_yaml.rb +7 -5
- data/lib/bioroebe/sequence/alignment.rb +1 -1
- data/lib/bioroebe/sequence/dna.rb +4 -2
- data/lib/bioroebe/sequence/nucleotide_module/nucleotide_module.rb +22 -8
- data/lib/bioroebe/sequence/protein.rb +2 -2
- data/lib/bioroebe/sequence/reverse_complement.rb +3 -3
- data/lib/bioroebe/sequence/rna.rb +9 -8
- data/lib/bioroebe/sequence/sequence.rb +3 -3
- data/lib/bioroebe/shell/configuration/additionally_set_xorg_buffer.yml +0 -0
- data/lib/bioroebe/shell/configuration/may_we_show_the_startup_information.yml +0 -0
- data/lib/bioroebe/shell/configuration/upcase_nucleotides.yml +0 -0
- data/lib/bioroebe/shell/configuration/use_silent_startup.yml +1 -1
- data/lib/bioroebe/shell/help/class.rb +68 -19
- data/lib/bioroebe/shell/menu.rb +5244 -5322
- data/lib/bioroebe/shell/{readline/readline.rb → readline.rb} +1 -3
- data/lib/bioroebe/shell/shell.rb +11240 -453
- data/lib/bioroebe/siRNA/siRNA.rb +3 -3
- data/lib/bioroebe/{gui/shared_code/blosum_matrix_viewer/blosum_matrix_viewer_module.rb → sinatra/sinatra_interface.rb} +28 -19
- data/lib/bioroebe/{www/sinatra/sinatra.rb → sinatra/sinatra_wrapper.rb} +731 -754
- data/lib/bioroebe/string_matching/find_longest_substring.rb +2 -10
- data/lib/bioroebe/string_matching/find_longest_substring_via_LCS_algorithm.rb +4 -14
- data/lib/bioroebe/string_matching/hamming_distance.rb +11 -10
- data/lib/bioroebe/string_matching/levensthein.rb +5 -17
- data/lib/bioroebe/string_matching/simple_string_comparer.rb +48 -4
- data/lib/bioroebe/string_matching/smith_waterman.rb +11 -6
- data/lib/bioroebe/svg/glyph.rb +4 -1
- data/lib/bioroebe/svg/mini_feature.rb +1 -1
- data/lib/bioroebe/svg/page.rb +18 -7
- data/lib/bioroebe/svg/svgee.rb +22 -13
- data/lib/bioroebe/svg/track.rb +20 -4
- data/lib/bioroebe/taxonomy/chart.rb +2 -2
- data/lib/bioroebe/taxonomy/class_methods.rb +5 -6
- data/lib/bioroebe/taxonomy/constants.rb +1 -1
- data/lib/bioroebe/taxonomy/info/info.rb +1 -1
- data/lib/bioroebe/taxonomy/info/is_dna.rb +1 -1
- data/lib/bioroebe/taxonomy/interactive.rb +1 -2
- data/lib/bioroebe/taxonomy/menu.rb +1 -1
- data/lib/bioroebe/taxonomy/node.rb +1 -1
- data/lib/bioroebe/taxonomy/parse_fasta.rb +4 -2
- data/lib/bioroebe/taxonomy/shared.rb +5 -4
- data/lib/bioroebe/taxonomy/taxonomy.rb +2 -4
- data/lib/bioroebe/toplevel_methods/fasta_and_fastq.rb +3 -45
- data/lib/bioroebe/toplevel_methods/{is_on_roebe.rb → roebe.rb} +1 -11
- data/lib/bioroebe/toplevel_methods/taxonomy.rb +6 -12
- data/lib/bioroebe/toplevel_methods/toplevel_methods.rb +5568 -0
- data/lib/bioroebe/utility_scripts/align_open_reading_frames.rb +4 -3
- data/lib/bioroebe/utility_scripts/analyse_local_dataset.rb +2 -2
- data/lib/bioroebe/utility_scripts/check_for_mismatches/check_for_mismatches.rb +16 -9
- data/lib/bioroebe/utility_scripts/compacter/compacter.rb +4 -2
- data/lib/bioroebe/utility_scripts/compare_these_two_sequences_via_blosum.rb +119 -0
- data/lib/bioroebe/utility_scripts/compseq/compseq.rb +11 -9
- data/lib/bioroebe/utility_scripts/{consensus_sequence.rb → consensus_sequence/consensus_sequence.rb} +13 -4
- data/lib/bioroebe/utility_scripts/{create_batch_entrez_file.rb → create_batch_entrez_file/create_batch_entrez_file.rb} +5 -5
- data/lib/bioroebe/utility_scripts/{determine_antigenic_areas.rb → determine_antigenic_areas/determine_antigenic_areas.rb} +5 -5
- data/lib/bioroebe/utility_scripts/{determine_missing_nucleotides_percentage.rb → determine_missing_nucleotides_percentage/determine_missing_nucleotides_percentage.rb} +16 -15
- data/lib/bioroebe/utility_scripts/display_open_reading_frames/display_open_reading_frames.rb +7 -7
- data/lib/bioroebe/utility_scripts/display_open_reading_frames/misc.rb +1 -1
- data/lib/bioroebe/utility_scripts/display_open_reading_frames/report.rb +2 -0
- data/lib/bioroebe/utility_scripts/{dot_alignment.rb → dot_alignment/dot_alignment.rb} +3 -3
- data/lib/bioroebe/utility_scripts/{download_files_from_rebase.rb → download_files_from_rebase/download_files_from_rebase.rb} +5 -5
- data/lib/bioroebe/utility_scripts/fetch_data_from_uniprot/fetch_data_from_uniprot.rb +269 -0
- data/lib/bioroebe/utility_scripts/find_gene.rb +4 -2
- data/lib/bioroebe/utility_scripts/{mirror_repeat.rb → mirror_repeat/mirror_repeat.rb} +5 -5
- data/lib/bioroebe/utility_scripts/move_file_to_its_correct_location.rb +3 -3
- data/lib/bioroebe/utility_scripts/{parse_taxonomy.rb → parse_taxonomy/parse_taxonomy.rb} +15 -6
- data/lib/bioroebe/utility_scripts/{pathways.rb → pathways/pathways.rb} +4 -3
- data/lib/bioroebe/utility_scripts/{permutations.rb → permutations/permutations.rb} +3 -3
- data/lib/bioroebe/utility_scripts/punnet/punnet.rb +4 -2
- data/lib/bioroebe/utility_scripts/{show_this_dna_sequence.rb → show_this_dna_sequence/show_this_dna_sequence.rb} +1 -1
- data/lib/bioroebe/utility_scripts/showorf/showorf.rb +406 -10
- data/lib/bioroebe/version/version.rb +2 -2
- data/lib/bioroebe/viennarna/rnafold_wrapper.rb +5 -13
- data/lib/bioroebe/virus/individual_viruses/README.md +15 -0
- data/lib/bioroebe/virus/individual_viruses/tobacco_mosaic_virus.rb +40 -0
- data/lib/bioroebe/virus/virus.rb +76 -0
- data/lib/bioroebe/www/bioroebe.cgi +4 -3
- data/lib/bioroebe/www/embeddable_interface.rb +85 -49
- data/lib/bioroebe/yaml/agarose/agarose_concentrations.yml +6 -6
- data/lib/bioroebe/yaml/antisense/antisense.yml +2 -0
- data/lib/bioroebe/yaml/blosum/blosum50.yml +6 -0
- data/lib/bioroebe/yaml/blosum/blosum90.yml +2 -1
- data/lib/bioroebe/yaml/chromosomes/chromosome_numbers.yml +2 -2
- data/lib/bioroebe/yaml/configuration/temp_dir.yml +1 -1
- data/lib/bioroebe/yaml/consensus_sequences/consensus_sequences.yml +1 -0
- data/lib/bioroebe/yaml/enzymes/enzyme_classes.yml +7 -6
- data/lib/bioroebe/yaml/humans/human_chromosomes.yml +3 -3
- data/lib/bioroebe/yaml/mRNA/mRNA.yml +1 -5
- data/lib/bioroebe/yaml/nucleotides/abbreviations_for_nucleotides.yml +1 -0
- data/lib/bioroebe/yaml/nucleotides/nucleotide_density.yml +2 -1
- data/lib/bioroebe/yaml/promoters/35S.yml +3 -1
- data/lib/bioroebe/yaml/proteases/proteases.yml +3 -1
- data/lib/bioroebe/yaml/proteins/ubiquitin.yml +4 -1
- data/lib/bioroebe/yaml/restriction_enzymes/restriction_enzymes.yml +7 -7
- data/spec/testing_toplevel_method_editor.rb +1 -1
- data/spec/testing_toplevel_method_verbose.rb +1 -1
- data/test/testing_dna_to_rna_conversion.rb +1 -1
- metadata +127 -235
- data/doc/blosum.md +0 -5
- data/lib/bioroebe/base/commandline_application/aminoacids.rb +0 -33
- data/lib/bioroebe/base/commandline_application/directory.rb +0 -33
- data/lib/bioroebe/base/commandline_application/extract.rb +0 -22
- data/lib/bioroebe/base/commandline_application/misc.rb +0 -502
- data/lib/bioroebe/base/commandline_application/opn.rb +0 -47
- data/lib/bioroebe/base/commandline_application/reset.rb +0 -42
- data/lib/bioroebe/base/commandline_application/warnings.rb +0 -36
- data/lib/bioroebe/base/commandline_application/write_what_into.rb +0 -29
- data/lib/bioroebe/base/initialize.rb +0 -18
- data/lib/bioroebe/base/misc.rb +0 -129
- data/lib/bioroebe/base/namespace.rb +0 -16
- data/lib/bioroebe/base/prototype/e_and_ee.rb +0 -24
- data/lib/bioroebe/base/prototype/misc.rb +0 -114
- data/lib/bioroebe/base/prototype/mkdir.rb +0 -20
- data/lib/bioroebe/base/prototype/reset.rb +0 -36
- data/lib/bioroebe/colours/misc_colours.rb +0 -80
- data/lib/bioroebe/colours/rev.rb +0 -44
- data/lib/bioroebe/colours/sdir.rb +0 -21
- data/lib/bioroebe/colours/sfancy.rb +0 -21
- data/lib/bioroebe/colours/sfile.rb +0 -21
- data/lib/bioroebe/colours/simp.rb +0 -21
- data/lib/bioroebe/colours/swarn.rb +0 -29
- data/lib/bioroebe/constants/aminoacids_and_proteins.rb +0 -147
- data/lib/bioroebe/constants/carriage_return.rb +0 -14
- data/lib/bioroebe/constants/codon_tables.rb +0 -77
- data/lib/bioroebe/constants/database_constants.rb +0 -107
- data/lib/bioroebe/constants/files_and_directories.rb +0 -606
- data/lib/bioroebe/constants/misc.rb +0 -209
- data/lib/bioroebe/constants/newline.rb +0 -14
- data/lib/bioroebe/constants/nucleotides.rb +0 -121
- data/lib/bioroebe/constants/regex.rb +0 -28
- data/lib/bioroebe/constants/roebe.rb +0 -38
- data/lib/bioroebe/constants/row_terminator.rb +0 -16
- data/lib/bioroebe/constants/tabulator.rb +0 -14
- data/lib/bioroebe/constants/unicode.rb +0 -12
- data/lib/bioroebe/constants/urls.rb +0 -50
- data/lib/bioroebe/gui/gtk +0 -1
- data/lib/bioroebe/gui/gtk3/README.md +0 -2
- data/lib/bioroebe/gui/gtk3/alignment/alignment.rb +0 -306
- data/lib/bioroebe/gui/gtk3/anti_sense_strand/anti_sense_strand.rb +0 -29
- data/lib/bioroebe/gui/gtk3/blosum_matrix_viewer/blosum_matrix_viewer.rb +0 -195
- data/lib/bioroebe/gui/gtk3/calculate_cell_numbers_of_bacteria/calculate_cell_numbers_of_bacteria.rb +0 -105
- data/lib/bioroebe/gui/gtk3/dna_to_reverse_complement_widget/dna_to_reverse_complement_widget.rb +0 -188
- data/lib/bioroebe/gui/gtk3/fasta_table_widget/fasta_table_widget.rb +0 -322
- data/lib/bioroebe/gui/gtk3/gene/gene.rb +0 -181
- data/lib/bioroebe/gui/gtk3/hamming_distance/hamming_distance.rb +0 -383
- data/lib/bioroebe/gui/gtk3/levensthein_distance/levensthein_distance.rb +0 -174
- data/lib/bioroebe/gui/gtk3/protein_to_DNA/protein_to_DNA.rb +0 -181
- data/lib/bioroebe/gui/gtk3/show_codon_table/show_codon_table.rb +0 -101
- data/lib/bioroebe/gui/gtk3/show_codon_usage/show_codon_usage.rb +0 -145
- data/lib/bioroebe/gui/gtk3/three_to_one/title.rb +0 -23
- data/lib/bioroebe/gui/jruby/alignment/alignment.rb +0 -165
- data/lib/bioroebe/gui/jruby/aminoacid_composition/aminoacid_composition.rb +0 -166
- data/lib/bioroebe/gui/jruby/blosum_matrix_viewer/blosum_matrix_viewer.rb +0 -82
- data/lib/bioroebe/gui/libui/README.md +0 -4
- data/lib/bioroebe/gui/libui/alignment/alignment.rb +0 -116
- data/lib/bioroebe/gui/libui/blosum_matrix_viewer/blosum_matrix_viewer.rb +0 -112
- data/lib/bioroebe/gui/libui/calculate_cell_numbers_of_bacteria/calculate_cell_numbers_of_bacteria.rb +0 -60
- data/lib/bioroebe/gui/libui/controller/controller.rb +0 -116
- data/lib/bioroebe/gui/libui/dna_to_aminoacid_widget/dna_to_aminoacid_widget.rb +0 -161
- data/lib/bioroebe/gui/libui/dna_to_reverse_complement_widget/dna_to_reverse_complement_widget.rb +0 -76
- data/lib/bioroebe/gui/libui/hamming_distance/hamming_distance.rb +0 -135
- data/lib/bioroebe/gui/libui/levensthein_distance/levensthein_distance.rb +0 -118
- data/lib/bioroebe/gui/libui/protein_to_DNA/protein_to_DNA.rb +0 -115
- data/lib/bioroebe/gui/libui/random_sequence/random_sequence.rb +0 -190
- data/lib/bioroebe/gui/libui/show_codon_table/show_codon_table.rb +0 -134
- data/lib/bioroebe/gui/libui/show_codon_usage/show_codon_usage.rb +0 -89
- data/lib/bioroebe/gui/libui/three_to_one/three_to_one.rb +0 -113
- data/lib/bioroebe/gui/shared_code/alignment/alignment_module.rb +0 -102
- data/lib/bioroebe/gui/shared_code/aminoacid_composition/aminoacid_composition_module.rb +0 -94
- data/lib/bioroebe/gui/shared_code/calculate_cell_numbers_of_bacteria/calculate_cell_numbers_of_bacteria_module.rb +0 -216
- data/lib/bioroebe/gui/shared_code/protein_to_DNA/protein_to_DNA_module.rb +0 -192
- data/lib/bioroebe/gui/shared_code/show_codon_table/show_codon_table_module.rb +0 -72
- data/lib/bioroebe/gui/tk/aminoacid_composition/aminoacid_composition.rb +0 -206
- data/lib/bioroebe/gui/tk/blosum_matrix_viewer/blosum_matrix_viewer.rb +0 -140
- data/lib/bioroebe/gui/tk/hamming_distance/hamming_distance.rb +0 -262
- data/lib/bioroebe/gui/tk/levensthein_distance/levensthein_distance.rb +0 -243
- data/lib/bioroebe/gui/tk/three_to_one/three_to_one.rb +0 -199
- data/lib/bioroebe/gui/unified_widgets/anti_sense_strand/anti_sense_strand.rb +0 -519
- data/lib/bioroebe/shell/colours/colours.rb +0 -235
- data/lib/bioroebe/shell/help/help.rb +0 -25
- data/lib/bioroebe/shell/misc.rb +0 -10227
- data/lib/bioroebe/toplevel_methods/ad_hoc_task.rb +0 -56
- data/lib/bioroebe/toplevel_methods/aminoacids_and_proteins.rb +0 -722
- data/lib/bioroebe/toplevel_methods/atomic_composition.rb +0 -198
- data/lib/bioroebe/toplevel_methods/base_composition.rb +0 -121
- data/lib/bioroebe/toplevel_methods/blast.rb +0 -153
- data/lib/bioroebe/toplevel_methods/calculate_n50_value.rb +0 -57
- data/lib/bioroebe/toplevel_methods/cat.rb +0 -71
- data/lib/bioroebe/toplevel_methods/chunked_display.rb +0 -92
- data/lib/bioroebe/toplevel_methods/cliner.rb +0 -81
- data/lib/bioroebe/toplevel_methods/complement.rb +0 -58
- data/lib/bioroebe/toplevel_methods/convert_global_env.rb +0 -39
- data/lib/bioroebe/toplevel_methods/databases.rb +0 -73
- data/lib/bioroebe/toplevel_methods/delimiter.rb +0 -19
- data/lib/bioroebe/toplevel_methods/digest.rb +0 -81
- data/lib/bioroebe/toplevel_methods/download_and_fetch_data.rb +0 -146
- data/lib/bioroebe/toplevel_methods/e.rb +0 -20
- data/lib/bioroebe/toplevel_methods/editor.rb +0 -21
- data/lib/bioroebe/toplevel_methods/esystem.rb +0 -22
- data/lib/bioroebe/toplevel_methods/exponential_growth.rb +0 -74
- data/lib/bioroebe/toplevel_methods/extract.rb +0 -56
- data/lib/bioroebe/toplevel_methods/file_and_directory_related_actions.rb +0 -269
- data/lib/bioroebe/toplevel_methods/frequencies.rb +0 -99
- data/lib/bioroebe/toplevel_methods/hamming_distance.rb +0 -60
- data/lib/bioroebe/toplevel_methods/infer.rb +0 -66
- data/lib/bioroebe/toplevel_methods/leading_five_prime_and_trailing_three_prime.rb +0 -101
- data/lib/bioroebe/toplevel_methods/levensthein.rb +0 -63
- data/lib/bioroebe/toplevel_methods/log_directory.rb +0 -109
- data/lib/bioroebe/toplevel_methods/longest_common_substring.rb +0 -55
- data/lib/bioroebe/toplevel_methods/map_ncbi_entry_to_eutils_id.rb +0 -88
- data/lib/bioroebe/toplevel_methods/matches.rb +0 -259
- data/lib/bioroebe/toplevel_methods/misc.rb +0 -596
- data/lib/bioroebe/toplevel_methods/nucleotides.rb +0 -787
- data/lib/bioroebe/toplevel_methods/number_of_clones.rb +0 -63
- data/lib/bioroebe/toplevel_methods/open_in_browser.rb +0 -79
- data/lib/bioroebe/toplevel_methods/open_reading_frames.rb +0 -236
- data/lib/bioroebe/toplevel_methods/opn.rb +0 -34
- data/lib/bioroebe/toplevel_methods/palindromes.rb +0 -155
- data/lib/bioroebe/toplevel_methods/parse.rb +0 -59
- data/lib/bioroebe/toplevel_methods/phred_error_probability.rb +0 -68
- data/lib/bioroebe/toplevel_methods/rds.rb +0 -24
- data/lib/bioroebe/toplevel_methods/remove.rb +0 -86
- data/lib/bioroebe/toplevel_methods/return_source_code_of_this_method.rb +0 -35
- data/lib/bioroebe/toplevel_methods/return_subsequence_based_on_indices.rb +0 -68
- data/lib/bioroebe/toplevel_methods/rna_splicing.rb +0 -73
- data/lib/bioroebe/toplevel_methods/rnalfold.rb +0 -69
- data/lib/bioroebe/toplevel_methods/searching_and_finding.rb +0 -116
- data/lib/bioroebe/toplevel_methods/shuffleseq.rb +0 -37
- data/lib/bioroebe/toplevel_methods/statistics.rb +0 -53
- data/lib/bioroebe/toplevel_methods/sum_of_odd_integers.rb +0 -62
- data/lib/bioroebe/toplevel_methods/three_delimiter.rb +0 -34
- data/lib/bioroebe/toplevel_methods/time_and_date.rb +0 -53
- data/lib/bioroebe/toplevel_methods/to_camelcase.rb +0 -31
- data/lib/bioroebe/toplevel_methods/truncate.rb +0 -48
- data/lib/bioroebe/toplevel_methods/url.rb +0 -36
- data/lib/bioroebe/toplevel_methods/verbose.rb +0 -59
- data/lib/bioroebe/utility_scripts/showorf/constants.rb +0 -31
- data/lib/bioroebe/utility_scripts/showorf/help.rb +0 -33
- data/lib/bioroebe/utility_scripts/showorf/initialize.rb +0 -52
- data/lib/bioroebe/utility_scripts/showorf/menu.rb +0 -68
- data/lib/bioroebe/utility_scripts/showorf/reset.rb +0 -36
- data/lib/bioroebe/utility_scripts/showorf/run.rb +0 -152
- data/lib/bioroebe/utility_scripts/showorf/show.rb +0 -97
- /data/doc/{german_names_for_the_aminoacids.md → german_names_for_the_aminoacids/german_names_for_the_aminoacids.md} +0 -0
- /data/doc/{pdb_ATOM_entry.md → pdb_ATOM_entry/pdb_ATOM_entry.md} +0 -0
- /data/doc/{resources.md → resources/resources.md} +0 -0
- /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/aminoacid_composition/customized_dialog.rb +0 -0
- /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/anti_sense_strand/anti_sense_strand.config +0 -0
- /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/calculate_cell_numbers_of_bacteria/calculate_cell_numbers_of_bacteria.config +0 -0
- /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/dna_to_reverse_complement_widget/dna_to_reverse_complement_widget.config +0 -0
- /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/hamming_distance/hamming_distance.config +0 -0
- /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/levensthein_distance/levensthein_distance.config +0 -0
- /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/protein_to_DNA/protein_to_DNA.config +0 -0
- /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/restriction_enzymes/restriction_enzymes.config +0 -0
- /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/www_finder/www_finder.config +0 -0
- /data/lib/bioroebe/yaml/{base_composition_of_dna.yml → base_composition_of_dna/base_composition_of_dna.yml} +0 -0
- /data/lib/bioroebe/yaml/{nuclear_localization_sequences.yml → nuclear_localization_sequences/nuclear_localization_sequences.yml} +0 -0
- /data/lib/bioroebe/yaml/{talens.yml → talens/talens.yml} +0 -0
@@ -1,68 +0,0 @@
|
|
1
|
-
#!/usr/bin/ruby -w
|
2
|
-
# Encoding: UTF-8
|
3
|
-
# frozen_string_literal: true
|
4
|
-
# =========================================================================== #
|
5
|
-
# require 'bioroebe/toplevel_methods/phred_error_probability.rb'
|
6
|
-
# Bioroebe.phred_error_probability(ARGV)
|
7
|
-
# =========================================================================== #
|
8
|
-
module Bioroebe
|
9
|
-
|
10
|
-
# ========================================================================= #
|
11
|
-
# === Bioroebe.phred_error_probability
|
12
|
-
#
|
13
|
-
# Datasets obtained from next-generation reads specify a Phred score
|
14
|
-
# for each base. This is also known as the "Q score" (Quality score).
|
15
|
-
#
|
16
|
-
# The Q score is an integer value, and is typically within the range 2
|
17
|
-
# to 40. Q indicates the probability that the base call is incorrect (P_e).
|
18
|
-
#
|
19
|
-
# For example, Q=2 means that the error probability is 63%, so the machine
|
20
|
-
# is reporting that the base is more likely to be wrong than right, while
|
21
|
-
# Q=20 corresponds to an error probability of only 1%.
|
22
|
-
#
|
23
|
-
# The second argument to this method can be used to format to a specific
|
24
|
-
# number. So if we pass in 6 as the second argument then the result will
|
25
|
-
# be rounded to 6 slots after the first '.'. See the usage examples
|
26
|
-
# below.
|
27
|
-
#
|
28
|
-
# Usage examples:
|
29
|
-
#
|
30
|
-
# Bioroebe.phred_error_probability '48'
|
31
|
-
# Bioroebe.phred_error_probability '48',6 # => "0.000016"
|
32
|
-
#
|
33
|
-
# ========================================================================= #
|
34
|
-
def self.phred_error_probability(
|
35
|
-
quality_score = 50,
|
36
|
-
optional_use_this_formatting = nil
|
37
|
-
)
|
38
|
-
if quality_score.is_a? Array
|
39
|
-
quality_score = quality_score.first
|
40
|
-
end
|
41
|
-
quality_score = quality_score.to_f # Need a Float past this point.
|
42
|
-
result = 10 ** (- quality_score / 10.0)
|
43
|
-
# ======================================================================= #
|
44
|
-
# Next, do some rounding if the user requested this through the
|
45
|
-
# second argument to this method.
|
46
|
-
# ======================================================================= #
|
47
|
-
if optional_use_this_formatting
|
48
|
-
if optional_use_this_formatting.is_a? Numeric
|
49
|
-
use_this_formatting_rule = "%.#{optional_use_this_formatting}f"
|
50
|
-
result = use_this_formatting_rule % result
|
51
|
-
else
|
52
|
-
result = optional_use_this_formatting.to_s % result
|
53
|
-
end
|
54
|
-
end
|
55
|
-
return result
|
56
|
-
end
|
57
|
-
|
58
|
-
end
|
59
|
-
|
60
|
-
if __FILE__ == $PROGRAM_NAME
|
61
|
-
if ARGV.empty?
|
62
|
-
(1 .. 40).each {|entry|
|
63
|
-
puts "#{entry.to_s.ljust(3)} #{Bioroebe.phred_error_probability(entry)}"
|
64
|
-
}
|
65
|
-
else
|
66
|
-
puts Bioroebe.phred_error_probability(ARGV)
|
67
|
-
end
|
68
|
-
end # phrederrorprobability 48
|
@@ -1,24 +0,0 @@
|
|
1
|
-
#!/usr/bin/ruby -w
|
2
|
-
# Encoding: UTF-8
|
3
|
-
# frozen_string_literal: true
|
4
|
-
# =========================================================================== #
|
5
|
-
# require 'bioroebe/toplevel_methods/rds.rb'
|
6
|
-
# =========================================================================== #
|
7
|
-
module Bioroebe
|
8
|
-
|
9
|
-
# ========================================================================= #
|
10
|
-
# === Bioroebe.rds
|
11
|
-
#
|
12
|
-
# rds is an abbreviation and is short for "remove double slashes".
|
13
|
-
#
|
14
|
-
# We will thus get rid of too many '/' tokens in a given string,
|
15
|
-
# via this method.
|
16
|
-
#
|
17
|
-
# This is mostly used in order to sanitize local file paths, as
|
18
|
-
# "foo//bar" entries look quite ugly.
|
19
|
-
# ========================================================================= #
|
20
|
-
def self.rds(i)
|
21
|
-
i.squeeze('/')
|
22
|
-
end
|
23
|
-
|
24
|
-
end
|
@@ -1,86 +0,0 @@
|
|
1
|
-
#!/usr/bin/ruby -w
|
2
|
-
# Encoding: UTF-8
|
3
|
-
# frozen_string_literal: true
|
4
|
-
# =========================================================================== #
|
5
|
-
# require 'bioroebe/toplevel_methods/remove.rb'
|
6
|
-
# Bioroebe.remove_numbers(ARGV)
|
7
|
-
# =========================================================================== #
|
8
|
-
module Bioroebe
|
9
|
-
|
10
|
-
# ========================================================================= #
|
11
|
-
# === Bioroebe.remove_numbers
|
12
|
-
#
|
13
|
-
# This method will simply remove numbers from the given input at hand.
|
14
|
-
#
|
15
|
-
# Usage example:
|
16
|
-
#
|
17
|
-
# Bioroebe.remove_numbers("abc123def")
|
18
|
-
#
|
19
|
-
# ========================================================================= #
|
20
|
-
def self.remove_numbers(i = ARGV)
|
21
|
-
if i.is_a? Array
|
22
|
-
i = i.join
|
23
|
-
end
|
24
|
-
i.gsub(/[0-9]/,'')
|
25
|
-
end; self.instance_eval { alias remove_numbers_from remove_numbers } # === Bioroebe.remove_numbers_from
|
26
|
-
|
27
|
-
# ========================================================================= #
|
28
|
-
# === Bioroebe.remove_subsequence
|
29
|
-
#
|
30
|
-
# This method will remove one or more subsequences from a given
|
31
|
-
# String at hand. The String that you wish to modify, should be
|
32
|
-
# given as the second argument to this method, called `from`.
|
33
|
-
#
|
34
|
-
# The first argument to this method can be an Array or a String - in
|
35
|
-
# either case, if the variable `from` contains this sequence, it
|
36
|
-
# will be removed.
|
37
|
-
#
|
38
|
-
# Note that only the FIRST occurence found will be removed - the others
|
39
|
-
# will be ignored, if they exist.
|
40
|
-
#
|
41
|
-
# The second argument to this method must be a String.
|
42
|
-
#
|
43
|
-
# Usage example:
|
44
|
-
#
|
45
|
-
# Bioroebe.remove_subsequence(["ATCGGTCGAA", "ATCGGTCGAGCGTGT"], 'ATGGTCTACATAGCTGACAAACAGCACGTAGCAATCGGTCGAATCTCGAGAGGCATATGGTCACATGATCGGTCGAGCGTGTTTCAAAGTTTGCGCCTAG')
|
46
|
-
# Bioroebe.remove_subsequence(array, main_sequence)
|
47
|
-
#
|
48
|
-
# ========================================================================= #
|
49
|
-
def self.remove_subsequence(
|
50
|
-
subsequence,
|
51
|
-
from # ← Must be a String.
|
52
|
-
)
|
53
|
-
unless from.is_a? String
|
54
|
-
raise 'Please input a String as second argument to this method.'
|
55
|
-
end
|
56
|
-
unless subsequence.is_a? Array
|
57
|
-
subsequence = [subsequence].flatten
|
58
|
-
end
|
59
|
-
from = from.dup if from.frozen?
|
60
|
-
subsequence.each {|this_subsequence|
|
61
|
-
from.sub!(/#{this_subsequence}/,'')
|
62
|
-
}
|
63
|
-
from # Return the, possibly modified, String here.
|
64
|
-
end; self.instance_eval { alias remove_subsequences remove_subsequence } # === Bioroebe.remove_subsequences
|
65
|
-
|
66
|
-
end
|
67
|
-
|
68
|
-
if __FILE__ == $PROGRAM_NAME
|
69
|
-
require 'colours/autoinclude'
|
70
|
-
alias e puts
|
71
|
-
main_sequence = 'ATGGTCTACATAGCTGACAAACAGCACGTAGCAATCGGTCGAATCTCGAGAGGCATATGGTCACATGATCGGTCGAGCGTGTTTCAAAGTTTGCGCCTAG'
|
72
|
-
subsequence1 = 'ATCGGTCGAA'
|
73
|
-
subsequence2 = 'ATCGGTCGAGCGTGT'
|
74
|
-
e "#{Colours.rev}The main sequence is:"
|
75
|
-
e
|
76
|
-
e " #{Colours.lightgreen(main_sequence)} (size: #{main_sequence.size})"
|
77
|
-
e
|
78
|
-
e 'The two subsequences '+Colours.slateblue(subsequence1)+
|
79
|
-
' and '+Colours.slateblue(subsequence2)+' will be removed next.'
|
80
|
-
e
|
81
|
-
e 'And now the resulting new String is:'
|
82
|
-
e
|
83
|
-
new_string = Bioroebe.remove_subsequence([subsequence1, subsequence2], main_sequence)
|
84
|
-
e " #{Colours.lightgreen(new_string)} (size: #{new_string.size})"
|
85
|
-
e
|
86
|
-
end # removesubsequence
|
@@ -1,35 +0,0 @@
|
|
1
|
-
#!/usr/bin/ruby -w
|
2
|
-
# Encoding: UTF-8
|
3
|
-
# frozen_string_literal: true
|
4
|
-
# =========================================================================== #
|
5
|
-
# require 'bioroebe/toplevel_methods/return_source_code_of_this_method.rb'
|
6
|
-
# Bioroebe.return_source_code_of_this_method
|
7
|
-
# =========================================================================== #
|
8
|
-
module Bioroebe
|
9
|
-
|
10
|
-
# ========================================================================= #
|
11
|
-
# === Bioroebe.return_source_code_of_this_method
|
12
|
-
#
|
13
|
-
# This method will return the source code of a particular method.
|
14
|
-
#
|
15
|
-
# Note that the method will stop at the first 'end' encountered.
|
16
|
-
# ========================================================================= #
|
17
|
-
def self.return_source_code_of_this_method(i)
|
18
|
-
if i.is_a? Array
|
19
|
-
i = i.first
|
20
|
-
end
|
21
|
-
content = i.source_location
|
22
|
-
full_content = File.readlines(
|
23
|
-
content[0].to_s
|
24
|
-
)[ (content[1]-1) .. -1 ].join.to_s
|
25
|
-
if full_content.include? 'end'
|
26
|
-
full_content = full_content[0 .. full_content.index('end')+2]
|
27
|
-
end
|
28
|
-
return full_content
|
29
|
-
end
|
30
|
-
|
31
|
-
end
|
32
|
-
|
33
|
-
if __FILE__ == $PROGRAM_NAME
|
34
|
-
Bioroebe.return_source_code_of_this_method
|
35
|
-
end
|
@@ -1,68 +0,0 @@
|
|
1
|
-
#!/usr/bin/ruby -w
|
2
|
-
# Encoding: UTF-8
|
3
|
-
# frozen_string_literal: true
|
4
|
-
# =========================================================================== #
|
5
|
-
# require 'bioroebe/toplevel_methods/return_subsequence_based_on_indices.rb'
|
6
|
-
# Bioroebe.return_subsequence_based_on_indices
|
7
|
-
# =========================================================================== #
|
8
|
-
module Bioroebe
|
9
|
-
|
10
|
-
# ========================================================================= #
|
11
|
-
# === Bioroebe.return_subsequence_based_on_indices
|
12
|
-
#
|
13
|
-
# This method will return a subsequence that was sliced out from the
|
14
|
-
# given input array of indices (the second argument to this method).
|
15
|
-
#
|
16
|
-
# This method here also allows us to read from an existing File. The
|
17
|
-
# format of that file has to be simple, though - the first line must
|
18
|
-
# be the sequence; and the second line will constitute the array
|
19
|
-
# of indices.
|
20
|
-
#
|
21
|
-
# For a usage example, see the end of this file here please. It has
|
22
|
-
# been written primarily to solve a specific task at Rosalind.
|
23
|
-
# ========================================================================= #
|
24
|
-
def self.return_subsequence_based_on_indices(
|
25
|
-
i, *array_of_indices
|
26
|
-
)
|
27
|
-
if array_of_indices.is_a? Array
|
28
|
-
array_of_indices.map! {|entry| entry.to_i }
|
29
|
-
end
|
30
|
-
result = ''.dup
|
31
|
-
if i and i.is_a?(String) and File.exist?(i)
|
32
|
-
dataset = File.readlines(i).reject {|line| line.strip.empty? }
|
33
|
-
i = dataset.first
|
34
|
-
array_of_indices = dataset.last.split(' ').map(&:to_i)
|
35
|
-
end
|
36
|
-
array_of_indices.each_slice(2).each {|a, b|
|
37
|
-
result << i[a .. b]+' '
|
38
|
-
}
|
39
|
-
result.strip
|
40
|
-
end
|
41
|
-
|
42
|
-
end
|
43
|
-
|
44
|
-
if __FILE__ == $PROGRAM_NAME
|
45
|
-
a = 22 # These four variables determine the sub-indices.
|
46
|
-
b = 27
|
47
|
-
c = 97
|
48
|
-
d = 102
|
49
|
-
if ARGV.empty?
|
50
|
-
test_this_string = 'HumptyDumptysatonawallHumptyDumpty'\
|
51
|
-
'hadagreatfallAlltheKingshorsesandalltheKingsmen'\
|
52
|
-
'CouldntputHumptyDumptyinhisplaceagain.'
|
53
|
-
else
|
54
|
-
test_this_string = ARGV.first
|
55
|
-
if test_this_string and File.file?(test_this_string)
|
56
|
-
dataset = File.readlines(test_this_string)
|
57
|
-
test_this_string = dataset.first
|
58
|
-
splitted = dataset.last.split(' ')
|
59
|
-
a = splitted[0]
|
60
|
-
b = splitted[1]
|
61
|
-
c = splitted[2]
|
62
|
-
d = splitted[3]
|
63
|
-
end
|
64
|
-
end
|
65
|
-
puts Bioroebe.return_subsequence_based_on_indices(
|
66
|
-
test_this_string, a, b, c, d
|
67
|
-
)
|
68
|
-
end # returnsubsequencebasedonindices /HUM.txt
|
@@ -1,73 +0,0 @@
|
|
1
|
-
#!/usr/bin/ruby -w
|
2
|
-
# Encoding: UTF-8
|
3
|
-
# frozen_string_literal: true
|
4
|
-
# =========================================================================== #
|
5
|
-
# require 'bioreobe/module_methods/rna_splicing.rb'
|
6
|
-
# =========================================================================== #
|
7
|
-
module Bioroebe
|
8
|
-
|
9
|
-
require 'bioroebe/toplevel_methods/remove.rb'
|
10
|
-
|
11
|
-
# ========================================================================= #
|
12
|
-
# === Bioroebe.rna_splicing
|
13
|
-
#
|
14
|
-
# This is a VERY primitive method that has been written primarily to
|
15
|
-
# solve a specific question on Rosalind.
|
16
|
-
#
|
17
|
-
# This is NOT how splicing normally works - but it works to solve
|
18
|
-
# the given question at Rosalind.
|
19
|
-
#
|
20
|
-
# Invocation example:
|
21
|
-
#
|
22
|
-
# Bioroebe.rna_splicing('/SPLICING.md')
|
23
|
-
#
|
24
|
-
# ========================================================================= #
|
25
|
-
def self.rna_splicing(i)
|
26
|
-
require 'bioroebe/fasta_and_fastq/parse_fasta/parse_fasta.rb'
|
27
|
-
if i and File.exist?(i)
|
28
|
-
# ===================================================================== #
|
29
|
-
# Read in the file should it exist.
|
30
|
-
# ===================================================================== #
|
31
|
-
i = File.read(i).strip
|
32
|
-
end
|
33
|
-
if i.is_a?(String) and i.include?('>')
|
34
|
-
_ = ::Bioroebe::ParseFasta.new(i) { :be_quiet }
|
35
|
-
sequences = _.sequences?
|
36
|
-
main_sequence = sequences.first
|
37
|
-
array_subsequences = sequences[1 .. -1]
|
38
|
-
result = ::Bioroebe.remove_subsequence(array_subsequences, main_sequence)
|
39
|
-
return result
|
40
|
-
end
|
41
|
-
end
|
42
|
-
|
43
|
-
end
|
44
|
-
|
45
|
-
if __FILE__ == $PROGRAM_NAME
|
46
|
-
alias e puts
|
47
|
-
if ARGV.empty?
|
48
|
-
use_this_dataset = '>Rosalind_10
|
49
|
-
ATGGTCTACATAGCTGACAAACAGCACGTAGCAATCGGTCGAATCTCGAGAGGCATATGGTCACATGATCGGTCGAGCGTGTTTCAAAGTTTGCGCCTAG
|
50
|
-
>Rosalind_12
|
51
|
-
ATCGGTCGAA
|
52
|
-
>Rosalind_15
|
53
|
-
ATCGGTCGAGCGTGT'
|
54
|
-
else
|
55
|
-
use_this_dataset = ARGV.first
|
56
|
-
end
|
57
|
-
e 'Original input is:'
|
58
|
-
e
|
59
|
-
e 'ATGGTCTACATAGCTGACAAACAGCACGTAGCAATCGGTCGAATCTCGAGAGGCATATGGTCACATGATCGGTCGAGCGTGTTTCAAAGTTTGCGCCTAG'
|
60
|
-
e
|
61
|
-
result = Bioroebe.rna_splicing use_this_dataset
|
62
|
-
e result
|
63
|
-
# ========================================================================= #
|
64
|
-
# The next code is if you need an aminoacid sequence:
|
65
|
-
# ========================================================================= #
|
66
|
-
e
|
67
|
-
e 'This corresponds to these aminoacids:'
|
68
|
-
e
|
69
|
-
e Bioroebe.to_aa(result)
|
70
|
-
e
|
71
|
-
end # rnasplicing
|
72
|
-
# rnasplicing /RNA_SPLICING.md
|
73
|
-
# rnasplicing /SPLICING.md
|
@@ -1,69 +0,0 @@
|
|
1
|
-
#!/usr/bin/ruby -w
|
2
|
-
# Encoding: UTF-8
|
3
|
-
# frozen_string_literal: true
|
4
|
-
# =========================================================================== #
|
5
|
-
# require 'bioroebe/toplevel_methods/rnalfold.rb'
|
6
|
-
# =========================================================================== #
|
7
|
-
module Bioroebe
|
8
|
-
|
9
|
-
require 'bioroebe/toplevel_methods/e.rb'
|
10
|
-
|
11
|
-
# ========================================================================= #
|
12
|
-
# === Bioroebe.rnalfold
|
13
|
-
#
|
14
|
-
# This method allows us to make use of RNALfold. By default the method
|
15
|
-
# will attempt to obtain all .fa files in the current directory; this
|
16
|
-
# should simplify batch-processing.
|
17
|
-
#
|
18
|
-
# Otherwise, the first input argument to this method should be the
|
19
|
-
# file(s) that you wish to manipulate.
|
20
|
-
#
|
21
|
-
# A typical usage example may be:
|
22
|
-
#
|
23
|
-
# Bioroebe.rnalfold { '--zscore=-3 -L 200' }
|
24
|
-
#
|
25
|
-
# ========================================================================= #
|
26
|
-
def self.rnalfold(
|
27
|
-
i = :use_all_fasta_files_in_the_current_directory
|
28
|
-
)
|
29
|
-
require 'bioroebe/colours/sfancy.rb'
|
30
|
-
require 'bioroebe/colours/sfile.rb'
|
31
|
-
# ======================================================================= #
|
32
|
-
# RNALfold will be used (as command).
|
33
|
-
# ======================================================================= #
|
34
|
-
use_this_command = 'RNALfold'.dup
|
35
|
-
case i
|
36
|
-
when :default,
|
37
|
-
:use_all_fasta_files_in_the_current_directory
|
38
|
-
i = Dir['**.fa']
|
39
|
-
end
|
40
|
-
if block_given?
|
41
|
-
yielded = yield
|
42
|
-
# ===================================================================== #
|
43
|
-
# Simply append these block-commands in that case:
|
44
|
-
# ===================================================================== #
|
45
|
-
use_this_command << " #{yielded}"
|
46
|
-
end
|
47
|
-
# ======================================================================= #
|
48
|
-
# We assume that our input is an Array past this point.
|
49
|
-
# ======================================================================= #
|
50
|
-
i.each {|this_file|
|
51
|
-
e "Working on `#{sfancy(this_file)}` next."
|
52
|
-
new_filename = this_file.dup
|
53
|
-
regex_to_use = /-L (\d+)/
|
54
|
-
use_this_command =~ regex_to_use
|
55
|
-
new_filename << '.'+$1.to_s.dup
|
56
|
-
new_filename << '.lfold'
|
57
|
-
_ = use_this_command+' < '+this_file+' > '+new_filename
|
58
|
-
esystem _
|
59
|
-
if File.exist? new_filename
|
60
|
-
e "A new file has been created at `#{sfile(new_filename)}`."
|
61
|
-
end
|
62
|
-
}
|
63
|
-
end
|
64
|
-
|
65
|
-
end
|
66
|
-
|
67
|
-
if __FILE__ == $PROGRAM_NAME
|
68
|
-
Bioroebe.rnalfold { '--zscore=-3 -L 200' }
|
69
|
-
end # bioroebernalfold
|
@@ -1,116 +0,0 @@
|
|
1
|
-
#!/usr/bin/ruby -w
|
2
|
-
# Encoding: UTF-8
|
3
|
-
# frozen_string_literal: true
|
4
|
-
# =========================================================================== #
|
5
|
-
# The file here will contain code that is related to "find"-ing something,
|
6
|
-
# typically within another string or object or dataset.
|
7
|
-
# =========================================================================== #
|
8
|
-
# require 'bioroebe/toplevel_methods/searching_and_finding.rb'
|
9
|
-
# Bioroebe.find_substring 'GATATATGCATATACTT', 'ATAT' # => [2, 4, 10]
|
10
|
-
# =========================================================================== #
|
11
|
-
module Bioroebe
|
12
|
-
|
13
|
-
# ========================================================================= #
|
14
|
-
# === Bioroebe.find_substring
|
15
|
-
#
|
16
|
-
# This method can be used to find a substring within a larger String.
|
17
|
-
#
|
18
|
-
# For example, in the below default values, the substring "ATAT"
|
19
|
-
# would exist at the positions 2, 4 and 10, if compared to the
|
20
|
-
# larger parent string "GATATATGCATATACTT".
|
21
|
-
#
|
22
|
-
# The following display may help you see this more easily, in
|
23
|
-
# regards to the substring matches:
|
24
|
-
#
|
25
|
-
# GATATATGCATATACTT
|
26
|
-
# ATATAT ATAT
|
27
|
-
#
|
28
|
-
# If you look closely, you will be able to see that "ATAT" can
|
29
|
-
# be found three times in the string above.
|
30
|
-
#
|
31
|
-
# Indices in this context start at position 1, not 0. This is
|
32
|
-
# mostly done to refer to nucleotides or aminoacids, which
|
33
|
-
# also typically start at the first letter. Position 0 makes
|
34
|
-
# no sense for a nucleotide - what would "nucleotide 0" even
|
35
|
-
# refer to?
|
36
|
-
#
|
37
|
-
# The first argument to this method may also be the path to a
|
38
|
-
# locally existing file, such as "/rosalind_subs.txt". In
|
39
|
-
# fact this method has been largely motivated by Rosalind
|
40
|
-
# tasks.
|
41
|
-
#
|
42
|
-
# The method will return an Array with the positions of all
|
43
|
-
# substrings that are found in the full_string variable. See
|
44
|
-
# the usage example below for how this may be.
|
45
|
-
#
|
46
|
-
# Usage example:
|
47
|
-
#
|
48
|
-
# Bioroebe.find_substring 'GATATATGCATATACTT', 'ATAT' # => [2, 4, 10]
|
49
|
-
#
|
50
|
-
# ========================================================================= #
|
51
|
-
def self.find_substring(
|
52
|
-
full_string = 'GATATATGCATATACTT', # ← The full String comes here.
|
53
|
-
this_substring = :default # ← The substring we are searching for comes here.
|
54
|
-
)
|
55
|
-
if full_string.is_a? Array
|
56
|
-
# ===================================================================== #
|
57
|
-
# Presently this method will only work on the first member of an Array.
|
58
|
-
# ===================================================================== #
|
59
|
-
full_string = full_string.first
|
60
|
-
end
|
61
|
-
if full_string and File.file?(full_string) and
|
62
|
-
this_substring == :default
|
63
|
-
# ===================================================================== #
|
64
|
-
# In this case it is ok to read from that file.
|
65
|
-
# ===================================================================== #
|
66
|
-
_ = File.read(full_string)
|
67
|
-
splitted = _.split("\n")
|
68
|
-
full_string = splitted.first
|
69
|
-
this_substring = splitted.last
|
70
|
-
end
|
71
|
-
case this_substring
|
72
|
-
# ======================================================================= #
|
73
|
-
# Use a default value in this case. In reality users should supply
|
74
|
-
# their own substring when they use this method here.
|
75
|
-
# ======================================================================= #
|
76
|
-
when :default,
|
77
|
-
nil
|
78
|
-
this_substring = 'ATAT'
|
79
|
-
else
|
80
|
-
if this_substring.empty?
|
81
|
-
this_substring = 'ATAT'
|
82
|
-
end
|
83
|
-
end
|
84
|
-
if full_string.nil? or full_string.empty?
|
85
|
-
full_string = 'GATATATGCATATACTT' # ← Use the default in this case.
|
86
|
-
end
|
87
|
-
result = Array.new.tap { |indexes|
|
88
|
-
final_index_position = full_string.size - this_substring.size
|
89
|
-
i = 0
|
90
|
-
while (i < final_index_position)
|
91
|
-
index = full_string.to_s.index(this_substring.to_s, i)
|
92
|
-
break if index.nil?
|
93
|
-
i = index + 1
|
94
|
-
indexes << i
|
95
|
-
end
|
96
|
-
}
|
97
|
-
result = nil if result.empty? # ← We will try this here; could also return an empty Array, though.
|
98
|
-
result # Return our findings here.
|
99
|
-
end; self.instance_eval { alias find_substring_indices find_substring } # === Bioroebe.find_substring_indices
|
100
|
-
|
101
|
-
end
|
102
|
-
|
103
|
-
if __FILE__ == $PROGRAM_NAME
|
104
|
-
if File.exist?(ARGV.first)
|
105
|
-
# ======================================================================= #
|
106
|
-
# Handle locally existing files first.
|
107
|
-
# ======================================================================= #
|
108
|
-
puts Bioroebe.find_substring(ARGV.first).join(' ').strip
|
109
|
-
else
|
110
|
-
puts Bioroebe.find_substring(ARGV[0], ARGV[1]).join(' ').strip
|
111
|
-
end
|
112
|
-
end # findsubstring TATATA AT
|
113
|
-
# findsubstring TATATATA AT
|
114
|
-
# findsubstring GATATATGCATATACTT ATAT
|
115
|
-
# findsubstring GATATATGCATATACTT ATAT
|
116
|
-
# findsubstring /rosalind_subs.txt
|
@@ -1,37 +0,0 @@
|
|
1
|
-
#!/usr/bin/ruby -w
|
2
|
-
# Encoding: UTF-8
|
3
|
-
# frozen_string_literal: true
|
4
|
-
# =========================================================================== #
|
5
|
-
# require 'bioroebe/toplevel_methods/shuffleseq.rb'
|
6
|
-
# Bioroebe.shuffleseq
|
7
|
-
# =========================================================================== #
|
8
|
-
module Bioroebe
|
9
|
-
|
10
|
-
# ========================================================================= #
|
11
|
-
# === Bioroebe.shuffleseq
|
12
|
-
#
|
13
|
-
# This method simulates the Emboss shuffleseq-functionality. It will
|
14
|
-
# take the input string, such as an assumed DNA sequence, and simply
|
15
|
-
# re-arrange it as-is.
|
16
|
-
#
|
17
|
-
# You can read this here:
|
18
|
-
#
|
19
|
-
# https://www.bioinformatics.nl/cgi-bin/emboss/shuffleseq
|
20
|
-
#
|
21
|
-
# Usage example:
|
22
|
-
#
|
23
|
-
# Bioroebe.shuffleseq 'ATCGATCG' # => "AGTTACGC"
|
24
|
-
#
|
25
|
-
# ========================================================================= #
|
26
|
-
def self.shuffleseq(i = ARGV)
|
27
|
-
if i.is_a? Array
|
28
|
-
i = i.join(' ').strip
|
29
|
-
end
|
30
|
-
return i.chars.shuffle.join
|
31
|
-
end; self.instance_eval { alias randomize_the_sequence shuffleseq } # === Bioroebe.randomize_the_sequence
|
32
|
-
|
33
|
-
end
|
34
|
-
|
35
|
-
if __FILE__ == $PROGRAM_NAME
|
36
|
-
puts Bioroebe.shuffleseq(ARGV)
|
37
|
-
end # shuffleseq ATCGATCG
|
@@ -1,53 +0,0 @@
|
|
1
|
-
#!/usr/bin/ruby -w
|
2
|
-
# Encoding: UTF-8
|
3
|
-
# frozen_string_literal: true
|
4
|
-
# =========================================================================== #
|
5
|
-
# require 'bioroebe/toplevel_methods/statistics.rb'
|
6
|
-
# Bioroebe.show_exon_statistics
|
7
|
-
# =========================================================================== #
|
8
|
-
module Bioroebe
|
9
|
-
|
10
|
-
require 'bioroebe/colours/colours.rb'
|
11
|
-
require 'bioroebe/toplevel_methods/e.rb'
|
12
|
-
require 'bioroebe/toplevel_methods/esystem.rb'
|
13
|
-
require 'bioroebe/toplevel_methods/file_and_directory_related_actions.rb'
|
14
|
-
|
15
|
-
# ========================================================================= #
|
16
|
-
# === Bioroebe.show_exon_statistics
|
17
|
-
#
|
18
|
-
# This is mostly "throw-away" code; it will quickly tell us how many
|
19
|
-
# exons may span over some junction.
|
20
|
-
#
|
21
|
-
# It was specifically created to analyze a .gtf file.
|
22
|
-
#
|
23
|
-
# Invocation example:
|
24
|
-
#
|
25
|
-
# bioroebe --show-exon-statistics-for=/tmp/praktikum/Mouse/chromosome_8/parsed/cdna.8.L100.global.gtf
|
26
|
-
#
|
27
|
-
# ========================================================================= #
|
28
|
-
def self.show_exon_statistics(these_files)
|
29
|
-
[these_files].flatten.compact.each {|this_file|
|
30
|
-
if File.exist? this_file
|
31
|
-
result = `cat #{this_file} | awk '{print $12}' | sort | uniq -c | sort -k1n | awk '{print $1}' | sort | uniq -c | less`
|
32
|
-
e gold(' n exons')
|
33
|
-
splitted = result.split("\n")
|
34
|
-
# =================================================================== #
|
35
|
-
# splitted may look like this:
|
36
|
-
#
|
37
|
-
# [" 89839 1", " 26031 2", " 1136 3", " 24 4"]
|
38
|
-
#
|
39
|
-
# =================================================================== #
|
40
|
-
splitted.each {|line|
|
41
|
-
e line.sub(/( \d+)$/, gold('\1'))
|
42
|
-
}
|
43
|
-
else
|
44
|
-
no_file_exists_at(this_file)
|
45
|
-
end
|
46
|
-
}
|
47
|
-
end
|
48
|
-
|
49
|
-
end
|
50
|
-
|
51
|
-
if __FILE__ == $PROGRAM_NAME
|
52
|
-
Bioroebe.show_exon_statistics(ARGV)
|
53
|
-
end # showexonstatistics /tmp/praktikum/Mouse/chromosome_8/parsed/cdna.8.L100.global.gtf
|