bioroebe 0.12.24 → 0.13.31

Sign up to get free protection for your applications and to get access to all the features.
Files changed (503) hide show
  1. checksums.yaml +4 -4
  2. data/LICENSE.md +7 -8
  3. data/README.md +566 -354
  4. data/bin/all_positions_of_this_nucleotide +1 -1
  5. data/bin/aminoacid_frequencies +1 -1
  6. data/bin/automatically_rename_this_fasta_file +1 -1
  7. data/bin/base_composition +1 -1
  8. data/bin/batch_create_windows_executables +1 -1
  9. data/bin/bioroebe +12 -1
  10. data/bin/bioroebe_cat +7 -0
  11. data/bin/calculate_exponential_growth +7 -0
  12. data/bin/calculate_n50_value +1 -1
  13. data/bin/calculate_the_frequencies_of_this_species +7 -0
  14. data/bin/chunked_display +1 -1
  15. data/bin/codon_frequency +1 -1
  16. data/bin/codon_to_aminoacid +1 -1
  17. data/bin/colourize_this_fasta_sequence +1 -1
  18. data/bin/complementary_dna_strand +1 -1
  19. data/bin/complementary_rna_strand +1 -1
  20. data/bin/consensus_sequence +1 -1
  21. data/bin/dna_to_rna +1 -1
  22. data/bin/downcase_chunked_display +1 -1
  23. data/bin/download_this_pdb +1 -1
  24. data/bin/fasta_index +1 -1
  25. data/bin/fetch_data_from_uniprot +1 -1
  26. data/bin/filter_away_invalid_nucleotides +1 -1
  27. data/bin/find_substring +1 -1
  28. data/bin/input_as_dna +1 -1
  29. data/bin/is_palindrome +1 -1
  30. data/bin/leading_five_prime +1 -1
  31. data/bin/longest_ORF +1 -1
  32. data/bin/longest_substring +1 -1
  33. data/bin/open_reading_frames +1 -1
  34. data/bin/partner_nucleotide +1 -1
  35. data/bin/plain_palindrome +1 -1
  36. data/bin/random_dna_sequence +1 -1
  37. data/bin/random_sequence +1 -1
  38. data/bin/raw_hamming_distance +1 -1
  39. data/bin/return_longest_substring_via_LCS_algorithm +1 -1
  40. data/bin/reverse_sequence +1 -1
  41. data/bin/short_aminoacid_letter_from_long_aminoacid_name +1 -1
  42. data/bin/show_atomic_composition +1 -1
  43. data/bin/show_fasta_header +1 -1
  44. data/bin/show_nucleotide_sequence +1 -1
  45. data/bin/show_this_dna_sequence +1 -1
  46. data/bin/show_time_now +7 -0
  47. data/bin/sort_aminoacid_based_on_its_hydrophobicity +1 -1
  48. data/bin/strict_filter_away_invalid_aminoacids +1 -1
  49. data/{lib/bioroebe/base/reset.rb → bin/three_delimiter} +9 -6
  50. data/bin/three_to_one +1 -1
  51. data/bin/to_rna +1 -1
  52. data/bin/trailing_three_prime +1 -1
  53. data/bin/upcase_this_aminoacid_sequence_and_remove_numbers +1 -1
  54. data/bioroebe.gemspec +6 -7
  55. data/doc/README.gen +534 -322
  56. data/doc/blosum/blosum.md +4 -0
  57. data/doc/compatibility/BIO_PHP.md +20 -18
  58. data/doc/compatibility/README.md +2 -3
  59. data/doc/compatibility/emboss.md +5 -3
  60. data/doc/{extensive_usage_example.md → extensive_usage_example/extensive_usage_example.md} +4 -2
  61. data/doc/{instructions_for_the_taxonomy_subproject.md → instructions_for_the_taxonomy_subproject/instructions_for_the_taxonomy_subproject.md} +36 -33
  62. data/doc/{legacy_paths.md → legacy_paths/legacy_paths.md} +3 -3
  63. data/doc/statistics/statistics.md +12 -10
  64. data/doc/todo/bioroebe_GUI_todo.md +6 -1
  65. data/doc/todo/bioroebe_java_todo.md +3 -2
  66. data/doc/todo/bioroebe_todo.md +328 -310
  67. data/doc/{using_biomart.md → using_biomart/using_biomart.md} +7 -3
  68. data/lib/bioroebe/abstract/features.rb +0 -0
  69. data/lib/bioroebe/aminoacids/aminoacid_substitution.rb +1 -1
  70. data/lib/bioroebe/aminoacids/aminoacids_mass_table.rb +3 -1
  71. data/lib/bioroebe/aminoacids/codon_percentage.rb +18 -10
  72. data/lib/bioroebe/aminoacids/create_random_aminoacids.rb +5 -2
  73. data/lib/bioroebe/aminoacids/deduce_aminoacid_sequence.rb +90 -64
  74. data/lib/bioroebe/aminoacids/display_aminoacid_table.rb +1 -3
  75. data/lib/bioroebe/aminoacids/show_hydrophobicity.rb +2 -2
  76. data/lib/bioroebe/annotations/create_annotation_format.rb +2 -2
  77. data/lib/bioroebe/base/base.rb +101 -6
  78. data/lib/bioroebe/base/base_module/base_module.rb +9 -1
  79. data/lib/bioroebe/base/colours.rb +3 -0
  80. data/lib/bioroebe/base/colours_for_base/colours_for_base.rb +80 -44
  81. data/lib/bioroebe/base/commandline_application/README.md +1 -1
  82. data/lib/bioroebe/base/commandline_application/commandline_application.rb +661 -22
  83. data/lib/bioroebe/base/commandline_application/commandline_arguments.rb +2 -1
  84. data/lib/bioroebe/base/infer_the_namespace_module/infer_the_namespace_module.rb +37 -0
  85. data/lib/bioroebe/base/internal_hash_module/internal_hash_module.rb +1 -6
  86. data/lib/bioroebe/base/prototype/prototype.rb +155 -14
  87. data/lib/bioroebe/biomart/attribute.rb +1 -1
  88. data/lib/bioroebe/biomart/biomart.rb +8 -9
  89. data/lib/bioroebe/biomart/server.rb +1 -1
  90. data/lib/bioroebe/blosum/blosum.rb +2 -2
  91. data/lib/bioroebe/calculate/calculate_blosum_score.rb +5 -3
  92. data/lib/bioroebe/calculate/calculate_gc_content.rb +1 -1
  93. data/lib/bioroebe/calculate/calculate_levensthein_distance.rb +5 -3
  94. data/lib/bioroebe/calculate/calculate_melting_temperature.rb +2 -10
  95. data/lib/bioroebe/calculate/calculate_melting_temperature_for_more_than_thirteen_nucleotides.rb +6 -15
  96. data/lib/bioroebe/calculate/calculate_the_position_specific_scoring_matrix.rb +4 -2
  97. data/lib/bioroebe/cell/cell.rb +3 -2
  98. data/lib/bioroebe/cell/specialized_cells/B_cell.rb +60 -0
  99. data/lib/bioroebe/cell/specialized_cells/Macrophage.rb +60 -0
  100. data/lib/bioroebe/cell/specialized_cells/README.md +5 -0
  101. data/lib/bioroebe/cell/specialized_cells/T_cell.rb +60 -0
  102. data/lib/bioroebe/cleave_and_digest/cleave.rb +3 -1
  103. data/lib/bioroebe/cleave_and_digest/digestion.rb +1 -1
  104. data/lib/bioroebe/codon_tables/frequencies/10090_Mus_musculus.yml +93 -0
  105. data/lib/bioroebe/codon_tables/frequencies/107243_Thlaspi_caerulescens.yml +72 -0
  106. data/lib/bioroebe/codon_tables/frequencies/parse_frequency_table.rb +2 -2
  107. data/lib/bioroebe/codons/codon_table.rb +10 -2
  108. data/lib/bioroebe/codons/codons.rb +3 -3
  109. data/lib/bioroebe/codons/convert_this_codon_to_that_aminoacid.rb +18 -15
  110. data/lib/bioroebe/codons/determine_optimal_codons.rb +1 -1
  111. data/lib/bioroebe/codons/possible_codons_for_this_aminoacid.rb +4 -2
  112. data/lib/bioroebe/codons/show_codon_tables.rb +1 -1
  113. data/lib/bioroebe/codons/show_codon_usage.rb +1 -2
  114. data/lib/bioroebe/codons/show_this_codon_table.rb +2 -2
  115. data/lib/bioroebe/codons/start_codons.rb +7 -3
  116. data/lib/bioroebe/colours/colour_schemes/README.md +1 -1
  117. data/lib/bioroebe/colours/colour_schemes/array_available_colour_schemes.rb +3 -3
  118. data/lib/bioroebe/colours/colour_schemes/colour_scheme.rb +3 -3
  119. data/lib/bioroebe/colours/colour_schemes/colour_scheme_demo.rb +4 -3
  120. data/lib/bioroebe/colours/colour_schemes/helix.rb +3 -1
  121. data/lib/bioroebe/colours/colour_schemes/hydropathy.rb +3 -1
  122. data/lib/bioroebe/colours/colour_schemes/score.rb +13 -2
  123. data/lib/bioroebe/colours/colour_schemes/strand.rb +3 -1
  124. data/lib/bioroebe/colours/colour_schemes/turn.rb +3 -1
  125. data/lib/bioroebe/colours/colour_schemes/zappo.rb +1 -1
  126. data/lib/bioroebe/{toplevel_methods/colourize_related_methods.rb → colours/colourize_related_code.rb} +1 -3
  127. data/lib/bioroebe/colours/colourize_sequence.rb +3 -1
  128. data/lib/bioroebe/colours/colours.rb +172 -15
  129. data/lib/bioroebe/configuration/configuration.rb +1 -1
  130. data/lib/bioroebe/constants/GUIs.rb +2 -2
  131. data/lib/bioroebe/constants/constants.rb +1349 -0
  132. data/lib/bioroebe/conversions/convert_aminoacid_to_dna.rb +8 -13
  133. data/lib/bioroebe/conversions/dna_to_aminoacid_sequence.rb +9 -3
  134. data/lib/bioroebe/count/count_amount_of_aminoacids.rb +11 -10
  135. data/lib/bioroebe/count/count_amount_of_nucleotides.rb +1 -1
  136. data/lib/bioroebe/count/count_at.rb +2 -1
  137. data/lib/bioroebe/databases/download_taxonomy_database.rb +1 -1
  138. data/lib/bioroebe/dotplots/advanced_dotplot.rb +2 -2
  139. data/lib/bioroebe/electron_microscopy/coordinate_analyzer.rb +2 -2
  140. data/lib/bioroebe/electron_microscopy/fix_pos_file.rb +2 -2
  141. data/lib/bioroebe/electron_microscopy/flipy.rb +2 -2
  142. data/lib/bioroebe/electron_microscopy/generate_em2em_file.rb +3 -11
  143. data/lib/bioroebe/electron_microscopy/parse_coordinates.rb +6 -6
  144. data/lib/bioroebe/electron_microscopy/read_file_xmd.rb +6 -6
  145. data/lib/bioroebe/electron_microscopy/simple_star_file_generator.rb +2 -2
  146. data/lib/bioroebe/enzymes/has_this_restriction_enzyme.rb +1 -1
  147. data/lib/bioroebe/enzymes/restriction_enzyme.rb +1 -1
  148. data/lib/bioroebe/enzymes/restriction_enzymes/statistics.rb +4 -3
  149. data/lib/bioroebe/enzymes/restriction_enzymes_file.rb +1 -1
  150. data/lib/bioroebe/enzymes/return_sequence_that_is_cut_via_restriction_enzyme.rb +4 -3
  151. data/lib/bioroebe/enzymes/show_restriction_enzymes.rb +3 -3
  152. data/lib/bioroebe/ext/main.cpp +0 -1
  153. data/lib/bioroebe/fasta_and_fastq/autocorrect_the_name_of_this_fasta_file.rb +3 -3
  154. data/lib/bioroebe/fasta_and_fastq/compact_fasta_file/compact_fasta_file.rb +1 -1
  155. data/lib/bioroebe/fasta_and_fastq/display_how_many_fasta_entries_are_in_this_directory.rb +1 -1
  156. data/lib/bioroebe/fasta_and_fastq/download_fasta.rb +8 -14
  157. data/lib/bioroebe/fasta_and_fastq/fasta_defline/fasta_defline.rb +1 -1
  158. data/lib/bioroebe/fasta_and_fastq/fasta_to_yaml/fasta_to_yaml.rb +1 -1
  159. data/lib/bioroebe/fasta_and_fastq/fastq_format_explainer.rb +1 -1
  160. data/lib/bioroebe/fasta_and_fastq/length_modifier/length_modifier.rb +1 -1
  161. data/lib/bioroebe/fasta_and_fastq/parse_fasta/parse_fasta.rb +37 -11
  162. data/lib/bioroebe/fasta_and_fastq/parse_fastq/parse_fastq.rb +2 -2
  163. data/lib/bioroebe/fasta_and_fastq/return_fasta_subsection_of_this_file.rb +1 -1
  164. data/lib/bioroebe/fasta_and_fastq/show_fasta_headers.rb +5 -13
  165. data/lib/bioroebe/fasta_and_fastq/show_fasta_statistics.rb +1 -1
  166. data/lib/bioroebe/fasta_and_fastq/simplify_fasta_header/simplify_fasta_header.rb +1 -1
  167. data/lib/bioroebe/fasta_and_fastq/split_this_fasta_file_into_chromosomes/reset.rb +3 -6
  168. data/lib/bioroebe/fasta_and_fastq/split_this_fasta_file_into_chromosomes/split_this_fasta_file_into_chromosomes.rb +3 -3
  169. data/lib/bioroebe/genbank/genbank_flat_file_format_generator.rb +20 -11
  170. data/lib/bioroebe/genome/genome.rb +1 -1
  171. data/lib/bioroebe/genomes/genome_pattern.rb +17 -16
  172. data/lib/bioroebe/genomes/genome_retriever.rb +4 -2
  173. data/lib/bioroebe/gui/experimental/snapgene/snapgene.rb +10 -13
  174. data/lib/bioroebe/gui/universal_widgets/alignment/alignment.rb +557 -0
  175. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/aminoacid_composition/aminoacid_composition.rb +498 -198
  176. data/lib/bioroebe/gui/universal_widgets/anti_sense_strand/anti_sense_strand.rb +665 -0
  177. data/lib/bioroebe/gui/universal_widgets/blosum_matrix_viewer/blosum_matrix_viewer.rb +329 -0
  178. data/lib/bioroebe/gui/universal_widgets/calculate_cell_numbers_of_bacteria/calculate_cell_numbers_of_bacteria.rb +423 -0
  179. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/controller/controller.rb +170 -118
  180. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/dna_to_aminoacid_widget/dna_to_aminoacid_widget.rb +277 -215
  181. data/lib/bioroebe/gui/{shared_code/dna_to_reverse_complement_widget/dna_to_reverse_complement_widget_module.rb → universal_widgets/dna_to_reverse_complement_widget/dna_to_reverse_complement_widget.rb} +297 -107
  182. data/lib/bioroebe/gui/universal_widgets/fasta_table_widget/fasta_table_widget.rb +643 -0
  183. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/format_converter/format_converter.rb +236 -164
  184. data/lib/bioroebe/gui/universal_widgets/gene/gene.rb +278 -0
  185. data/lib/bioroebe/gui/universal_widgets/hamming_distance/hamming_distance.rb +646 -0
  186. data/lib/bioroebe/gui/{shared_code/levensthein_distance/levensthein_distance_module.rb → universal_widgets/levensthein_distance/levensthein_distance.rb} +313 -88
  187. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/nucleotide_analyser/nucleotide_analyser.rb +281 -189
  188. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/parse_pdb_file/parse_pdb_file.rb +265 -149
  189. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/primer_design_widget/primer_design_widget.rb +337 -263
  190. data/lib/bioroebe/gui/universal_widgets/protein_to_DNA/protein_to_DNA.rb +408 -0
  191. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/random_sequence/random_sequence.rb +245 -187
  192. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/restriction_enzymes/restriction_enzymes.rb +207 -137
  193. data/lib/bioroebe/gui/universal_widgets/shell/shell.rb +288 -0
  194. data/lib/bioroebe/gui/{gtk3/show_codon_table/misc.rb → universal_widgets/show_codon_table/show_codon_table.rb} +290 -110
  195. data/lib/bioroebe/gui/{shared_code/show_codon_usage/show_codon_usage_module.rb → universal_widgets/show_codon_usage/show_codon_usage.rb} +228 -47
  196. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/sizeseq/sizeseq.rb +151 -69
  197. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/three_to_one/three_to_one.rb +190 -127
  198. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/www_finder/www_finder.rb +211 -152
  199. data/lib/bioroebe/images/images.html +953 -1170
  200. data/lib/bioroebe/images/misc/README.md +6 -0
  201. data/lib/bioroebe/images/misc/activation.avif +0 -0
  202. data/lib/bioroebe/images/misc/inhibition.avif +0 -0
  203. data/lib/bioroebe/images/misc/small_virus_logo.avif +0 -0
  204. data/lib/bioroebe/{constants/base_directory.rb → log_directory/log_directory.rb} +79 -59
  205. data/lib/bioroebe/matplotlib/matplotlib_generator.rb +1 -1
  206. data/lib/bioroebe/misc/quiz/three_letter_to_aminoacid.rb +1 -1
  207. data/lib/bioroebe/misc/ruler.rb +5 -5
  208. data/lib/bioroebe/misc/useful_formulas.rb +3 -3
  209. data/lib/bioroebe/ncbi/efetch.rb +1 -2
  210. data/lib/bioroebe/ngs/phred_quality_score_table.rb +3 -3
  211. data/lib/bioroebe/nucleotides/complementary_dna_strand.rb +3 -6
  212. data/lib/bioroebe/nucleotides/molecular_weight_of_nucleotides.rb +3 -3
  213. data/lib/bioroebe/nucleotides/most_likely_nucleotide_sequence_for_this_aminoacid_sequence.rb +6 -10
  214. data/lib/bioroebe/nucleotides/{show_nucleotide_sequence.rb → show_nucleotide_sequence/show_nucleotide_sequence.rb} +377 -255
  215. data/lib/bioroebe/palindromes/palindrome_2D_structure.rb +1 -1
  216. data/lib/bioroebe/palindromes/palindrome_finder.rb +1 -1
  217. data/lib/bioroebe/palindromes/palindrome_generator.rb +2 -10
  218. data/lib/bioroebe/parsers/biolang_parser.rb +1 -1
  219. data/lib/bioroebe/parsers/blosum_parser.rb +14 -19
  220. data/lib/bioroebe/parsers/genbank_parser.rb +2 -6
  221. data/lib/bioroebe/parsers/gff.rb +9 -9
  222. data/lib/bioroebe/parsers/parse_embl.rb +2 -6
  223. data/lib/bioroebe/parsers/stride_parser.rb +4 -12
  224. data/lib/bioroebe/patterns/analyse_glycosylation_pattern.rb +2 -2
  225. data/lib/bioroebe/patterns/is_this_sequence_a_EGF2_pattern.rb +6 -3
  226. data/lib/bioroebe/patterns/profile_pattern.rb +2 -2
  227. data/lib/bioroebe/patterns/rgg_scanner.rb +4 -2
  228. data/lib/bioroebe/{protein_structure → pdb_and_protein_structure}/alpha_helix.rb +2 -2
  229. data/lib/bioroebe/{pdb → pdb_and_protein_structure}/download_this_pdb.rb +2 -3
  230. data/lib/bioroebe/{pdb → pdb_and_protein_structure}/fetch_fasta_sequence_from_pdb.rb +4 -4
  231. data/lib/bioroebe/{protein_structure → pdb_and_protein_structure}/helical_wheel.rb +2 -2
  232. data/lib/bioroebe/{pdb → pdb_and_protein_structure}/parse_mmCIF_file.rb +1 -1
  233. data/lib/bioroebe/{pdb → pdb_and_protein_structure}/parse_pdb_file.rb +3 -3
  234. data/lib/bioroebe/{pdb → pdb_and_protein_structure}/report_secondary_structures_from_this_pdb_file.rb +3 -3
  235. data/lib/bioroebe/project/project.rb +3 -1
  236. data/lib/bioroebe/raw_sequence/README.md +8 -8
  237. data/lib/bioroebe/raw_sequence/raw_sequence.rb +11 -2
  238. data/lib/bioroebe/regexes/regexes.rb +1 -2
  239. data/lib/bioroebe/requires/commandline_application.rb +3 -1
  240. data/lib/bioroebe/requires/require_all_pdb_files.rb +1 -1
  241. data/lib/bioroebe/requires/require_all_taxonomy_files.rb +1 -1
  242. data/lib/bioroebe/requires/require_all_utility_scripts_files.rb +10 -0
  243. data/lib/bioroebe/requires/require_colours.rb +1 -1
  244. data/lib/bioroebe/requires/require_the_bioroebe_project.rb +5 -7
  245. data/lib/bioroebe/requires/require_the_bioroebe_sinatra_components.rb +1 -1
  246. data/lib/bioroebe/requires/require_the_constants.rb +2 -14
  247. data/lib/bioroebe/requires/require_yaml.rb +7 -5
  248. data/lib/bioroebe/sequence/alignment.rb +1 -1
  249. data/lib/bioroebe/sequence/dna.rb +4 -2
  250. data/lib/bioroebe/sequence/nucleotide_module/nucleotide_module.rb +22 -8
  251. data/lib/bioroebe/sequence/protein.rb +2 -2
  252. data/lib/bioroebe/sequence/reverse_complement.rb +3 -3
  253. data/lib/bioroebe/sequence/rna.rb +9 -8
  254. data/lib/bioroebe/sequence/sequence.rb +3 -3
  255. data/lib/bioroebe/shell/configuration/additionally_set_xorg_buffer.yml +0 -0
  256. data/lib/bioroebe/shell/configuration/may_we_show_the_startup_information.yml +0 -0
  257. data/lib/bioroebe/shell/configuration/upcase_nucleotides.yml +0 -0
  258. data/lib/bioroebe/shell/configuration/use_silent_startup.yml +1 -1
  259. data/lib/bioroebe/shell/help/class.rb +68 -19
  260. data/lib/bioroebe/shell/menu.rb +5244 -5322
  261. data/lib/bioroebe/shell/{readline/readline.rb → readline.rb} +1 -3
  262. data/lib/bioroebe/shell/shell.rb +11240 -453
  263. data/lib/bioroebe/siRNA/siRNA.rb +3 -3
  264. data/lib/bioroebe/{gui/shared_code/blosum_matrix_viewer/blosum_matrix_viewer_module.rb → sinatra/sinatra_interface.rb} +28 -19
  265. data/lib/bioroebe/{www/sinatra/sinatra.rb → sinatra/sinatra_wrapper.rb} +731 -754
  266. data/lib/bioroebe/string_matching/find_longest_substring.rb +2 -10
  267. data/lib/bioroebe/string_matching/find_longest_substring_via_LCS_algorithm.rb +4 -14
  268. data/lib/bioroebe/string_matching/hamming_distance.rb +11 -10
  269. data/lib/bioroebe/string_matching/levensthein.rb +5 -17
  270. data/lib/bioroebe/string_matching/simple_string_comparer.rb +48 -4
  271. data/lib/bioroebe/string_matching/smith_waterman.rb +11 -6
  272. data/lib/bioroebe/svg/glyph.rb +4 -1
  273. data/lib/bioroebe/svg/mini_feature.rb +1 -1
  274. data/lib/bioroebe/svg/page.rb +18 -7
  275. data/lib/bioroebe/svg/svgee.rb +22 -13
  276. data/lib/bioroebe/svg/track.rb +20 -4
  277. data/lib/bioroebe/taxonomy/chart.rb +2 -2
  278. data/lib/bioroebe/taxonomy/class_methods.rb +5 -6
  279. data/lib/bioroebe/taxonomy/constants.rb +1 -1
  280. data/lib/bioroebe/taxonomy/info/info.rb +1 -1
  281. data/lib/bioroebe/taxonomy/info/is_dna.rb +1 -1
  282. data/lib/bioroebe/taxonomy/interactive.rb +1 -2
  283. data/lib/bioroebe/taxonomy/menu.rb +1 -1
  284. data/lib/bioroebe/taxonomy/node.rb +1 -1
  285. data/lib/bioroebe/taxonomy/parse_fasta.rb +4 -2
  286. data/lib/bioroebe/taxonomy/shared.rb +5 -4
  287. data/lib/bioroebe/taxonomy/taxonomy.rb +2 -4
  288. data/lib/bioroebe/toplevel_methods/fasta_and_fastq.rb +3 -45
  289. data/lib/bioroebe/toplevel_methods/{is_on_roebe.rb → roebe.rb} +1 -11
  290. data/lib/bioroebe/toplevel_methods/taxonomy.rb +6 -12
  291. data/lib/bioroebe/toplevel_methods/toplevel_methods.rb +5568 -0
  292. data/lib/bioroebe/utility_scripts/align_open_reading_frames.rb +4 -3
  293. data/lib/bioroebe/utility_scripts/analyse_local_dataset.rb +2 -2
  294. data/lib/bioroebe/utility_scripts/check_for_mismatches/check_for_mismatches.rb +16 -9
  295. data/lib/bioroebe/utility_scripts/compacter/compacter.rb +4 -2
  296. data/lib/bioroebe/utility_scripts/compare_these_two_sequences_via_blosum.rb +119 -0
  297. data/lib/bioroebe/utility_scripts/compseq/compseq.rb +11 -9
  298. data/lib/bioroebe/utility_scripts/{consensus_sequence.rb → consensus_sequence/consensus_sequence.rb} +13 -4
  299. data/lib/bioroebe/utility_scripts/{create_batch_entrez_file.rb → create_batch_entrez_file/create_batch_entrez_file.rb} +5 -5
  300. data/lib/bioroebe/utility_scripts/{determine_antigenic_areas.rb → determine_antigenic_areas/determine_antigenic_areas.rb} +5 -5
  301. data/lib/bioroebe/utility_scripts/{determine_missing_nucleotides_percentage.rb → determine_missing_nucleotides_percentage/determine_missing_nucleotides_percentage.rb} +16 -15
  302. data/lib/bioroebe/utility_scripts/display_open_reading_frames/display_open_reading_frames.rb +7 -7
  303. data/lib/bioroebe/utility_scripts/display_open_reading_frames/misc.rb +1 -1
  304. data/lib/bioroebe/utility_scripts/display_open_reading_frames/report.rb +2 -0
  305. data/lib/bioroebe/utility_scripts/{dot_alignment.rb → dot_alignment/dot_alignment.rb} +3 -3
  306. data/lib/bioroebe/utility_scripts/{download_files_from_rebase.rb → download_files_from_rebase/download_files_from_rebase.rb} +5 -5
  307. data/lib/bioroebe/utility_scripts/fetch_data_from_uniprot/fetch_data_from_uniprot.rb +269 -0
  308. data/lib/bioroebe/utility_scripts/find_gene.rb +4 -2
  309. data/lib/bioroebe/utility_scripts/{mirror_repeat.rb → mirror_repeat/mirror_repeat.rb} +5 -5
  310. data/lib/bioroebe/utility_scripts/move_file_to_its_correct_location.rb +3 -3
  311. data/lib/bioroebe/utility_scripts/{parse_taxonomy.rb → parse_taxonomy/parse_taxonomy.rb} +15 -6
  312. data/lib/bioroebe/utility_scripts/{pathways.rb → pathways/pathways.rb} +4 -3
  313. data/lib/bioroebe/utility_scripts/{permutations.rb → permutations/permutations.rb} +3 -3
  314. data/lib/bioroebe/utility_scripts/punnet/punnet.rb +4 -2
  315. data/lib/bioroebe/utility_scripts/{show_this_dna_sequence.rb → show_this_dna_sequence/show_this_dna_sequence.rb} +1 -1
  316. data/lib/bioroebe/utility_scripts/showorf/showorf.rb +406 -10
  317. data/lib/bioroebe/version/version.rb +2 -2
  318. data/lib/bioroebe/viennarna/rnafold_wrapper.rb +5 -13
  319. data/lib/bioroebe/virus/individual_viruses/README.md +15 -0
  320. data/lib/bioroebe/virus/individual_viruses/tobacco_mosaic_virus.rb +40 -0
  321. data/lib/bioroebe/virus/virus.rb +76 -0
  322. data/lib/bioroebe/www/bioroebe.cgi +4 -3
  323. data/lib/bioroebe/www/embeddable_interface.rb +85 -49
  324. data/lib/bioroebe/yaml/agarose/agarose_concentrations.yml +6 -6
  325. data/lib/bioroebe/yaml/antisense/antisense.yml +2 -0
  326. data/lib/bioroebe/yaml/blosum/blosum50.yml +6 -0
  327. data/lib/bioroebe/yaml/blosum/blosum90.yml +2 -1
  328. data/lib/bioroebe/yaml/chromosomes/chromosome_numbers.yml +2 -2
  329. data/lib/bioroebe/yaml/configuration/temp_dir.yml +1 -1
  330. data/lib/bioroebe/yaml/consensus_sequences/consensus_sequences.yml +1 -0
  331. data/lib/bioroebe/yaml/enzymes/enzyme_classes.yml +7 -6
  332. data/lib/bioroebe/yaml/humans/human_chromosomes.yml +3 -3
  333. data/lib/bioroebe/yaml/mRNA/mRNA.yml +1 -5
  334. data/lib/bioroebe/yaml/nucleotides/abbreviations_for_nucleotides.yml +1 -0
  335. data/lib/bioroebe/yaml/nucleotides/nucleotide_density.yml +2 -1
  336. data/lib/bioroebe/yaml/promoters/35S.yml +3 -1
  337. data/lib/bioroebe/yaml/proteases/proteases.yml +3 -1
  338. data/lib/bioroebe/yaml/proteins/ubiquitin.yml +4 -1
  339. data/lib/bioroebe/yaml/restriction_enzymes/restriction_enzymes.yml +7 -7
  340. data/spec/testing_toplevel_method_editor.rb +1 -1
  341. data/spec/testing_toplevel_method_verbose.rb +1 -1
  342. data/test/testing_dna_to_rna_conversion.rb +1 -1
  343. metadata +127 -235
  344. data/doc/blosum.md +0 -5
  345. data/lib/bioroebe/base/commandline_application/aminoacids.rb +0 -33
  346. data/lib/bioroebe/base/commandline_application/directory.rb +0 -33
  347. data/lib/bioroebe/base/commandline_application/extract.rb +0 -22
  348. data/lib/bioroebe/base/commandline_application/misc.rb +0 -502
  349. data/lib/bioroebe/base/commandline_application/opn.rb +0 -47
  350. data/lib/bioroebe/base/commandline_application/reset.rb +0 -42
  351. data/lib/bioroebe/base/commandline_application/warnings.rb +0 -36
  352. data/lib/bioroebe/base/commandline_application/write_what_into.rb +0 -29
  353. data/lib/bioroebe/base/initialize.rb +0 -18
  354. data/lib/bioroebe/base/misc.rb +0 -129
  355. data/lib/bioroebe/base/namespace.rb +0 -16
  356. data/lib/bioroebe/base/prototype/e_and_ee.rb +0 -24
  357. data/lib/bioroebe/base/prototype/misc.rb +0 -114
  358. data/lib/bioroebe/base/prototype/mkdir.rb +0 -20
  359. data/lib/bioroebe/base/prototype/reset.rb +0 -36
  360. data/lib/bioroebe/colours/misc_colours.rb +0 -80
  361. data/lib/bioroebe/colours/rev.rb +0 -44
  362. data/lib/bioroebe/colours/sdir.rb +0 -21
  363. data/lib/bioroebe/colours/sfancy.rb +0 -21
  364. data/lib/bioroebe/colours/sfile.rb +0 -21
  365. data/lib/bioroebe/colours/simp.rb +0 -21
  366. data/lib/bioroebe/colours/swarn.rb +0 -29
  367. data/lib/bioroebe/constants/aminoacids_and_proteins.rb +0 -147
  368. data/lib/bioroebe/constants/carriage_return.rb +0 -14
  369. data/lib/bioroebe/constants/codon_tables.rb +0 -77
  370. data/lib/bioroebe/constants/database_constants.rb +0 -107
  371. data/lib/bioroebe/constants/files_and_directories.rb +0 -606
  372. data/lib/bioroebe/constants/misc.rb +0 -209
  373. data/lib/bioroebe/constants/newline.rb +0 -14
  374. data/lib/bioroebe/constants/nucleotides.rb +0 -121
  375. data/lib/bioroebe/constants/regex.rb +0 -28
  376. data/lib/bioroebe/constants/roebe.rb +0 -38
  377. data/lib/bioroebe/constants/row_terminator.rb +0 -16
  378. data/lib/bioroebe/constants/tabulator.rb +0 -14
  379. data/lib/bioroebe/constants/unicode.rb +0 -12
  380. data/lib/bioroebe/constants/urls.rb +0 -50
  381. data/lib/bioroebe/gui/gtk +0 -1
  382. data/lib/bioroebe/gui/gtk3/README.md +0 -2
  383. data/lib/bioroebe/gui/gtk3/alignment/alignment.rb +0 -306
  384. data/lib/bioroebe/gui/gtk3/anti_sense_strand/anti_sense_strand.rb +0 -29
  385. data/lib/bioroebe/gui/gtk3/blosum_matrix_viewer/blosum_matrix_viewer.rb +0 -195
  386. data/lib/bioroebe/gui/gtk3/calculate_cell_numbers_of_bacteria/calculate_cell_numbers_of_bacteria.rb +0 -105
  387. data/lib/bioroebe/gui/gtk3/dna_to_reverse_complement_widget/dna_to_reverse_complement_widget.rb +0 -188
  388. data/lib/bioroebe/gui/gtk3/fasta_table_widget/fasta_table_widget.rb +0 -322
  389. data/lib/bioroebe/gui/gtk3/gene/gene.rb +0 -181
  390. data/lib/bioroebe/gui/gtk3/hamming_distance/hamming_distance.rb +0 -383
  391. data/lib/bioroebe/gui/gtk3/levensthein_distance/levensthein_distance.rb +0 -174
  392. data/lib/bioroebe/gui/gtk3/protein_to_DNA/protein_to_DNA.rb +0 -181
  393. data/lib/bioroebe/gui/gtk3/show_codon_table/show_codon_table.rb +0 -101
  394. data/lib/bioroebe/gui/gtk3/show_codon_usage/show_codon_usage.rb +0 -145
  395. data/lib/bioroebe/gui/gtk3/three_to_one/title.rb +0 -23
  396. data/lib/bioroebe/gui/jruby/alignment/alignment.rb +0 -165
  397. data/lib/bioroebe/gui/jruby/aminoacid_composition/aminoacid_composition.rb +0 -166
  398. data/lib/bioroebe/gui/jruby/blosum_matrix_viewer/blosum_matrix_viewer.rb +0 -82
  399. data/lib/bioroebe/gui/libui/README.md +0 -4
  400. data/lib/bioroebe/gui/libui/alignment/alignment.rb +0 -116
  401. data/lib/bioroebe/gui/libui/blosum_matrix_viewer/blosum_matrix_viewer.rb +0 -112
  402. data/lib/bioroebe/gui/libui/calculate_cell_numbers_of_bacteria/calculate_cell_numbers_of_bacteria.rb +0 -60
  403. data/lib/bioroebe/gui/libui/controller/controller.rb +0 -116
  404. data/lib/bioroebe/gui/libui/dna_to_aminoacid_widget/dna_to_aminoacid_widget.rb +0 -161
  405. data/lib/bioroebe/gui/libui/dna_to_reverse_complement_widget/dna_to_reverse_complement_widget.rb +0 -76
  406. data/lib/bioroebe/gui/libui/hamming_distance/hamming_distance.rb +0 -135
  407. data/lib/bioroebe/gui/libui/levensthein_distance/levensthein_distance.rb +0 -118
  408. data/lib/bioroebe/gui/libui/protein_to_DNA/protein_to_DNA.rb +0 -115
  409. data/lib/bioroebe/gui/libui/random_sequence/random_sequence.rb +0 -190
  410. data/lib/bioroebe/gui/libui/show_codon_table/show_codon_table.rb +0 -134
  411. data/lib/bioroebe/gui/libui/show_codon_usage/show_codon_usage.rb +0 -89
  412. data/lib/bioroebe/gui/libui/three_to_one/three_to_one.rb +0 -113
  413. data/lib/bioroebe/gui/shared_code/alignment/alignment_module.rb +0 -102
  414. data/lib/bioroebe/gui/shared_code/aminoacid_composition/aminoacid_composition_module.rb +0 -94
  415. data/lib/bioroebe/gui/shared_code/calculate_cell_numbers_of_bacteria/calculate_cell_numbers_of_bacteria_module.rb +0 -216
  416. data/lib/bioroebe/gui/shared_code/protein_to_DNA/protein_to_DNA_module.rb +0 -192
  417. data/lib/bioroebe/gui/shared_code/show_codon_table/show_codon_table_module.rb +0 -72
  418. data/lib/bioroebe/gui/tk/aminoacid_composition/aminoacid_composition.rb +0 -206
  419. data/lib/bioroebe/gui/tk/blosum_matrix_viewer/blosum_matrix_viewer.rb +0 -140
  420. data/lib/bioroebe/gui/tk/hamming_distance/hamming_distance.rb +0 -262
  421. data/lib/bioroebe/gui/tk/levensthein_distance/levensthein_distance.rb +0 -243
  422. data/lib/bioroebe/gui/tk/three_to_one/three_to_one.rb +0 -199
  423. data/lib/bioroebe/gui/unified_widgets/anti_sense_strand/anti_sense_strand.rb +0 -519
  424. data/lib/bioroebe/shell/colours/colours.rb +0 -235
  425. data/lib/bioroebe/shell/help/help.rb +0 -25
  426. data/lib/bioroebe/shell/misc.rb +0 -10227
  427. data/lib/bioroebe/toplevel_methods/ad_hoc_task.rb +0 -56
  428. data/lib/bioroebe/toplevel_methods/aminoacids_and_proteins.rb +0 -722
  429. data/lib/bioroebe/toplevel_methods/atomic_composition.rb +0 -198
  430. data/lib/bioroebe/toplevel_methods/base_composition.rb +0 -121
  431. data/lib/bioroebe/toplevel_methods/blast.rb +0 -153
  432. data/lib/bioroebe/toplevel_methods/calculate_n50_value.rb +0 -57
  433. data/lib/bioroebe/toplevel_methods/cat.rb +0 -71
  434. data/lib/bioroebe/toplevel_methods/chunked_display.rb +0 -92
  435. data/lib/bioroebe/toplevel_methods/cliner.rb +0 -81
  436. data/lib/bioroebe/toplevel_methods/complement.rb +0 -58
  437. data/lib/bioroebe/toplevel_methods/convert_global_env.rb +0 -39
  438. data/lib/bioroebe/toplevel_methods/databases.rb +0 -73
  439. data/lib/bioroebe/toplevel_methods/delimiter.rb +0 -19
  440. data/lib/bioroebe/toplevel_methods/digest.rb +0 -81
  441. data/lib/bioroebe/toplevel_methods/download_and_fetch_data.rb +0 -146
  442. data/lib/bioroebe/toplevel_methods/e.rb +0 -20
  443. data/lib/bioroebe/toplevel_methods/editor.rb +0 -21
  444. data/lib/bioroebe/toplevel_methods/esystem.rb +0 -22
  445. data/lib/bioroebe/toplevel_methods/exponential_growth.rb +0 -74
  446. data/lib/bioroebe/toplevel_methods/extract.rb +0 -56
  447. data/lib/bioroebe/toplevel_methods/file_and_directory_related_actions.rb +0 -269
  448. data/lib/bioroebe/toplevel_methods/frequencies.rb +0 -99
  449. data/lib/bioroebe/toplevel_methods/hamming_distance.rb +0 -60
  450. data/lib/bioroebe/toplevel_methods/infer.rb +0 -66
  451. data/lib/bioroebe/toplevel_methods/leading_five_prime_and_trailing_three_prime.rb +0 -101
  452. data/lib/bioroebe/toplevel_methods/levensthein.rb +0 -63
  453. data/lib/bioroebe/toplevel_methods/log_directory.rb +0 -109
  454. data/lib/bioroebe/toplevel_methods/longest_common_substring.rb +0 -55
  455. data/lib/bioroebe/toplevel_methods/map_ncbi_entry_to_eutils_id.rb +0 -88
  456. data/lib/bioroebe/toplevel_methods/matches.rb +0 -259
  457. data/lib/bioroebe/toplevel_methods/misc.rb +0 -596
  458. data/lib/bioroebe/toplevel_methods/nucleotides.rb +0 -787
  459. data/lib/bioroebe/toplevel_methods/number_of_clones.rb +0 -63
  460. data/lib/bioroebe/toplevel_methods/open_in_browser.rb +0 -79
  461. data/lib/bioroebe/toplevel_methods/open_reading_frames.rb +0 -236
  462. data/lib/bioroebe/toplevel_methods/opn.rb +0 -34
  463. data/lib/bioroebe/toplevel_methods/palindromes.rb +0 -155
  464. data/lib/bioroebe/toplevel_methods/parse.rb +0 -59
  465. data/lib/bioroebe/toplevel_methods/phred_error_probability.rb +0 -68
  466. data/lib/bioroebe/toplevel_methods/rds.rb +0 -24
  467. data/lib/bioroebe/toplevel_methods/remove.rb +0 -86
  468. data/lib/bioroebe/toplevel_methods/return_source_code_of_this_method.rb +0 -35
  469. data/lib/bioroebe/toplevel_methods/return_subsequence_based_on_indices.rb +0 -68
  470. data/lib/bioroebe/toplevel_methods/rna_splicing.rb +0 -73
  471. data/lib/bioroebe/toplevel_methods/rnalfold.rb +0 -69
  472. data/lib/bioroebe/toplevel_methods/searching_and_finding.rb +0 -116
  473. data/lib/bioroebe/toplevel_methods/shuffleseq.rb +0 -37
  474. data/lib/bioroebe/toplevel_methods/statistics.rb +0 -53
  475. data/lib/bioroebe/toplevel_methods/sum_of_odd_integers.rb +0 -62
  476. data/lib/bioroebe/toplevel_methods/three_delimiter.rb +0 -34
  477. data/lib/bioroebe/toplevel_methods/time_and_date.rb +0 -53
  478. data/lib/bioroebe/toplevel_methods/to_camelcase.rb +0 -31
  479. data/lib/bioroebe/toplevel_methods/truncate.rb +0 -48
  480. data/lib/bioroebe/toplevel_methods/url.rb +0 -36
  481. data/lib/bioroebe/toplevel_methods/verbose.rb +0 -59
  482. data/lib/bioroebe/utility_scripts/showorf/constants.rb +0 -31
  483. data/lib/bioroebe/utility_scripts/showorf/help.rb +0 -33
  484. data/lib/bioroebe/utility_scripts/showorf/initialize.rb +0 -52
  485. data/lib/bioroebe/utility_scripts/showorf/menu.rb +0 -68
  486. data/lib/bioroebe/utility_scripts/showorf/reset.rb +0 -36
  487. data/lib/bioroebe/utility_scripts/showorf/run.rb +0 -152
  488. data/lib/bioroebe/utility_scripts/showorf/show.rb +0 -97
  489. /data/doc/{german_names_for_the_aminoacids.md → german_names_for_the_aminoacids/german_names_for_the_aminoacids.md} +0 -0
  490. /data/doc/{pdb_ATOM_entry.md → pdb_ATOM_entry/pdb_ATOM_entry.md} +0 -0
  491. /data/doc/{resources.md → resources/resources.md} +0 -0
  492. /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/aminoacid_composition/customized_dialog.rb +0 -0
  493. /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/anti_sense_strand/anti_sense_strand.config +0 -0
  494. /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/calculate_cell_numbers_of_bacteria/calculate_cell_numbers_of_bacteria.config +0 -0
  495. /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/dna_to_reverse_complement_widget/dna_to_reverse_complement_widget.config +0 -0
  496. /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/hamming_distance/hamming_distance.config +0 -0
  497. /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/levensthein_distance/levensthein_distance.config +0 -0
  498. /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/protein_to_DNA/protein_to_DNA.config +0 -0
  499. /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/restriction_enzymes/restriction_enzymes.config +0 -0
  500. /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/www_finder/www_finder.config +0 -0
  501. /data/lib/bioroebe/yaml/{base_composition_of_dna.yml → base_composition_of_dna/base_composition_of_dna.yml} +0 -0
  502. /data/lib/bioroebe/yaml/{nuclear_localization_sequences.yml → nuclear_localization_sequences/nuclear_localization_sequences.yml} +0 -0
  503. /data/lib/bioroebe/yaml/{talens.yml → talens/talens.yml} +0 -0
@@ -1,68 +0,0 @@
1
- #!/usr/bin/ruby -w
2
- # Encoding: UTF-8
3
- # frozen_string_literal: true
4
- # =========================================================================== #
5
- # require 'bioroebe/toplevel_methods/phred_error_probability.rb'
6
- # Bioroebe.phred_error_probability(ARGV)
7
- # =========================================================================== #
8
- module Bioroebe
9
-
10
- # ========================================================================= #
11
- # === Bioroebe.phred_error_probability
12
- #
13
- # Datasets obtained from next-generation reads specify a Phred score
14
- # for each base. This is also known as the "Q score" (Quality score).
15
- #
16
- # The Q score is an integer value, and is typically within the range 2
17
- # to 40. Q indicates the probability that the base call is incorrect (P_e).
18
- #
19
- # For example, Q=2 means that the error probability is 63%, so the machine
20
- # is reporting that the base is more likely to be wrong than right, while
21
- # Q=20 corresponds to an error probability of only 1%.
22
- #
23
- # The second argument to this method can be used to format to a specific
24
- # number. So if we pass in 6 as the second argument then the result will
25
- # be rounded to 6 slots after the first '.'. See the usage examples
26
- # below.
27
- #
28
- # Usage examples:
29
- #
30
- # Bioroebe.phred_error_probability '48'
31
- # Bioroebe.phred_error_probability '48',6 # => "0.000016"
32
- #
33
- # ========================================================================= #
34
- def self.phred_error_probability(
35
- quality_score = 50,
36
- optional_use_this_formatting = nil
37
- )
38
- if quality_score.is_a? Array
39
- quality_score = quality_score.first
40
- end
41
- quality_score = quality_score.to_f # Need a Float past this point.
42
- result = 10 ** (- quality_score / 10.0)
43
- # ======================================================================= #
44
- # Next, do some rounding if the user requested this through the
45
- # second argument to this method.
46
- # ======================================================================= #
47
- if optional_use_this_formatting
48
- if optional_use_this_formatting.is_a? Numeric
49
- use_this_formatting_rule = "%.#{optional_use_this_formatting}f"
50
- result = use_this_formatting_rule % result
51
- else
52
- result = optional_use_this_formatting.to_s % result
53
- end
54
- end
55
- return result
56
- end
57
-
58
- end
59
-
60
- if __FILE__ == $PROGRAM_NAME
61
- if ARGV.empty?
62
- (1 .. 40).each {|entry|
63
- puts "#{entry.to_s.ljust(3)} #{Bioroebe.phred_error_probability(entry)}"
64
- }
65
- else
66
- puts Bioroebe.phred_error_probability(ARGV)
67
- end
68
- end # phrederrorprobability 48
@@ -1,24 +0,0 @@
1
- #!/usr/bin/ruby -w
2
- # Encoding: UTF-8
3
- # frozen_string_literal: true
4
- # =========================================================================== #
5
- # require 'bioroebe/toplevel_methods/rds.rb'
6
- # =========================================================================== #
7
- module Bioroebe
8
-
9
- # ========================================================================= #
10
- # === Bioroebe.rds
11
- #
12
- # rds is an abbreviation and is short for "remove double slashes".
13
- #
14
- # We will thus get rid of too many '/' tokens in a given string,
15
- # via this method.
16
- #
17
- # This is mostly used in order to sanitize local file paths, as
18
- # "foo//bar" entries look quite ugly.
19
- # ========================================================================= #
20
- def self.rds(i)
21
- i.squeeze('/')
22
- end
23
-
24
- end
@@ -1,86 +0,0 @@
1
- #!/usr/bin/ruby -w
2
- # Encoding: UTF-8
3
- # frozen_string_literal: true
4
- # =========================================================================== #
5
- # require 'bioroebe/toplevel_methods/remove.rb'
6
- # Bioroebe.remove_numbers(ARGV)
7
- # =========================================================================== #
8
- module Bioroebe
9
-
10
- # ========================================================================= #
11
- # === Bioroebe.remove_numbers
12
- #
13
- # This method will simply remove numbers from the given input at hand.
14
- #
15
- # Usage example:
16
- #
17
- # Bioroebe.remove_numbers("abc123def")
18
- #
19
- # ========================================================================= #
20
- def self.remove_numbers(i = ARGV)
21
- if i.is_a? Array
22
- i = i.join
23
- end
24
- i.gsub(/[0-9]/,'')
25
- end; self.instance_eval { alias remove_numbers_from remove_numbers } # === Bioroebe.remove_numbers_from
26
-
27
- # ========================================================================= #
28
- # === Bioroebe.remove_subsequence
29
- #
30
- # This method will remove one or more subsequences from a given
31
- # String at hand. The String that you wish to modify, should be
32
- # given as the second argument to this method, called `from`.
33
- #
34
- # The first argument to this method can be an Array or a String - in
35
- # either case, if the variable `from` contains this sequence, it
36
- # will be removed.
37
- #
38
- # Note that only the FIRST occurence found will be removed - the others
39
- # will be ignored, if they exist.
40
- #
41
- # The second argument to this method must be a String.
42
- #
43
- # Usage example:
44
- #
45
- # Bioroebe.remove_subsequence(["ATCGGTCGAA", "ATCGGTCGAGCGTGT"], 'ATGGTCTACATAGCTGACAAACAGCACGTAGCAATCGGTCGAATCTCGAGAGGCATATGGTCACATGATCGGTCGAGCGTGTTTCAAAGTTTGCGCCTAG')
46
- # Bioroebe.remove_subsequence(array, main_sequence)
47
- #
48
- # ========================================================================= #
49
- def self.remove_subsequence(
50
- subsequence,
51
- from # ← Must be a String.
52
- )
53
- unless from.is_a? String
54
- raise 'Please input a String as second argument to this method.'
55
- end
56
- unless subsequence.is_a? Array
57
- subsequence = [subsequence].flatten
58
- end
59
- from = from.dup if from.frozen?
60
- subsequence.each {|this_subsequence|
61
- from.sub!(/#{this_subsequence}/,'')
62
- }
63
- from # Return the, possibly modified, String here.
64
- end; self.instance_eval { alias remove_subsequences remove_subsequence } # === Bioroebe.remove_subsequences
65
-
66
- end
67
-
68
- if __FILE__ == $PROGRAM_NAME
69
- require 'colours/autoinclude'
70
- alias e puts
71
- main_sequence = 'ATGGTCTACATAGCTGACAAACAGCACGTAGCAATCGGTCGAATCTCGAGAGGCATATGGTCACATGATCGGTCGAGCGTGTTTCAAAGTTTGCGCCTAG'
72
- subsequence1 = 'ATCGGTCGAA'
73
- subsequence2 = 'ATCGGTCGAGCGTGT'
74
- e "#{Colours.rev}The main sequence is:"
75
- e
76
- e " #{Colours.lightgreen(main_sequence)} (size: #{main_sequence.size})"
77
- e
78
- e 'The two subsequences '+Colours.slateblue(subsequence1)+
79
- ' and '+Colours.slateblue(subsequence2)+' will be removed next.'
80
- e
81
- e 'And now the resulting new String is:'
82
- e
83
- new_string = Bioroebe.remove_subsequence([subsequence1, subsequence2], main_sequence)
84
- e " #{Colours.lightgreen(new_string)} (size: #{new_string.size})"
85
- e
86
- end # removesubsequence
@@ -1,35 +0,0 @@
1
- #!/usr/bin/ruby -w
2
- # Encoding: UTF-8
3
- # frozen_string_literal: true
4
- # =========================================================================== #
5
- # require 'bioroebe/toplevel_methods/return_source_code_of_this_method.rb'
6
- # Bioroebe.return_source_code_of_this_method
7
- # =========================================================================== #
8
- module Bioroebe
9
-
10
- # ========================================================================= #
11
- # === Bioroebe.return_source_code_of_this_method
12
- #
13
- # This method will return the source code of a particular method.
14
- #
15
- # Note that the method will stop at the first 'end' encountered.
16
- # ========================================================================= #
17
- def self.return_source_code_of_this_method(i)
18
- if i.is_a? Array
19
- i = i.first
20
- end
21
- content = i.source_location
22
- full_content = File.readlines(
23
- content[0].to_s
24
- )[ (content[1]-1) .. -1 ].join.to_s
25
- if full_content.include? 'end'
26
- full_content = full_content[0 .. full_content.index('end')+2]
27
- end
28
- return full_content
29
- end
30
-
31
- end
32
-
33
- if __FILE__ == $PROGRAM_NAME
34
- Bioroebe.return_source_code_of_this_method
35
- end
@@ -1,68 +0,0 @@
1
- #!/usr/bin/ruby -w
2
- # Encoding: UTF-8
3
- # frozen_string_literal: true
4
- # =========================================================================== #
5
- # require 'bioroebe/toplevel_methods/return_subsequence_based_on_indices.rb'
6
- # Bioroebe.return_subsequence_based_on_indices
7
- # =========================================================================== #
8
- module Bioroebe
9
-
10
- # ========================================================================= #
11
- # === Bioroebe.return_subsequence_based_on_indices
12
- #
13
- # This method will return a subsequence that was sliced out from the
14
- # given input array of indices (the second argument to this method).
15
- #
16
- # This method here also allows us to read from an existing File. The
17
- # format of that file has to be simple, though - the first line must
18
- # be the sequence; and the second line will constitute the array
19
- # of indices.
20
- #
21
- # For a usage example, see the end of this file here please. It has
22
- # been written primarily to solve a specific task at Rosalind.
23
- # ========================================================================= #
24
- def self.return_subsequence_based_on_indices(
25
- i, *array_of_indices
26
- )
27
- if array_of_indices.is_a? Array
28
- array_of_indices.map! {|entry| entry.to_i }
29
- end
30
- result = ''.dup
31
- if i and i.is_a?(String) and File.exist?(i)
32
- dataset = File.readlines(i).reject {|line| line.strip.empty? }
33
- i = dataset.first
34
- array_of_indices = dataset.last.split(' ').map(&:to_i)
35
- end
36
- array_of_indices.each_slice(2).each {|a, b|
37
- result << i[a .. b]+' '
38
- }
39
- result.strip
40
- end
41
-
42
- end
43
-
44
- if __FILE__ == $PROGRAM_NAME
45
- a = 22 # These four variables determine the sub-indices.
46
- b = 27
47
- c = 97
48
- d = 102
49
- if ARGV.empty?
50
- test_this_string = 'HumptyDumptysatonawallHumptyDumpty'\
51
- 'hadagreatfallAlltheKingshorsesandalltheKingsmen'\
52
- 'CouldntputHumptyDumptyinhisplaceagain.'
53
- else
54
- test_this_string = ARGV.first
55
- if test_this_string and File.file?(test_this_string)
56
- dataset = File.readlines(test_this_string)
57
- test_this_string = dataset.first
58
- splitted = dataset.last.split(' ')
59
- a = splitted[0]
60
- b = splitted[1]
61
- c = splitted[2]
62
- d = splitted[3]
63
- end
64
- end
65
- puts Bioroebe.return_subsequence_based_on_indices(
66
- test_this_string, a, b, c, d
67
- )
68
- end # returnsubsequencebasedonindices /HUM.txt
@@ -1,73 +0,0 @@
1
- #!/usr/bin/ruby -w
2
- # Encoding: UTF-8
3
- # frozen_string_literal: true
4
- # =========================================================================== #
5
- # require 'bioreobe/module_methods/rna_splicing.rb'
6
- # =========================================================================== #
7
- module Bioroebe
8
-
9
- require 'bioroebe/toplevel_methods/remove.rb'
10
-
11
- # ========================================================================= #
12
- # === Bioroebe.rna_splicing
13
- #
14
- # This is a VERY primitive method that has been written primarily to
15
- # solve a specific question on Rosalind.
16
- #
17
- # This is NOT how splicing normally works - but it works to solve
18
- # the given question at Rosalind.
19
- #
20
- # Invocation example:
21
- #
22
- # Bioroebe.rna_splicing('/SPLICING.md')
23
- #
24
- # ========================================================================= #
25
- def self.rna_splicing(i)
26
- require 'bioroebe/fasta_and_fastq/parse_fasta/parse_fasta.rb'
27
- if i and File.exist?(i)
28
- # ===================================================================== #
29
- # Read in the file should it exist.
30
- # ===================================================================== #
31
- i = File.read(i).strip
32
- end
33
- if i.is_a?(String) and i.include?('>')
34
- _ = ::Bioroebe::ParseFasta.new(i) { :be_quiet }
35
- sequences = _.sequences?
36
- main_sequence = sequences.first
37
- array_subsequences = sequences[1 .. -1]
38
- result = ::Bioroebe.remove_subsequence(array_subsequences, main_sequence)
39
- return result
40
- end
41
- end
42
-
43
- end
44
-
45
- if __FILE__ == $PROGRAM_NAME
46
- alias e puts
47
- if ARGV.empty?
48
- use_this_dataset = '>Rosalind_10
49
- ATGGTCTACATAGCTGACAAACAGCACGTAGCAATCGGTCGAATCTCGAGAGGCATATGGTCACATGATCGGTCGAGCGTGTTTCAAAGTTTGCGCCTAG
50
- >Rosalind_12
51
- ATCGGTCGAA
52
- >Rosalind_15
53
- ATCGGTCGAGCGTGT'
54
- else
55
- use_this_dataset = ARGV.first
56
- end
57
- e 'Original input is:'
58
- e
59
- e 'ATGGTCTACATAGCTGACAAACAGCACGTAGCAATCGGTCGAATCTCGAGAGGCATATGGTCACATGATCGGTCGAGCGTGTTTCAAAGTTTGCGCCTAG'
60
- e
61
- result = Bioroebe.rna_splicing use_this_dataset
62
- e result
63
- # ========================================================================= #
64
- # The next code is if you need an aminoacid sequence:
65
- # ========================================================================= #
66
- e
67
- e 'This corresponds to these aminoacids:'
68
- e
69
- e Bioroebe.to_aa(result)
70
- e
71
- end # rnasplicing
72
- # rnasplicing /RNA_SPLICING.md
73
- # rnasplicing /SPLICING.md
@@ -1,69 +0,0 @@
1
- #!/usr/bin/ruby -w
2
- # Encoding: UTF-8
3
- # frozen_string_literal: true
4
- # =========================================================================== #
5
- # require 'bioroebe/toplevel_methods/rnalfold.rb'
6
- # =========================================================================== #
7
- module Bioroebe
8
-
9
- require 'bioroebe/toplevel_methods/e.rb'
10
-
11
- # ========================================================================= #
12
- # === Bioroebe.rnalfold
13
- #
14
- # This method allows us to make use of RNALfold. By default the method
15
- # will attempt to obtain all .fa files in the current directory; this
16
- # should simplify batch-processing.
17
- #
18
- # Otherwise, the first input argument to this method should be the
19
- # file(s) that you wish to manipulate.
20
- #
21
- # A typical usage example may be:
22
- #
23
- # Bioroebe.rnalfold { '--zscore=-3 -L 200' }
24
- #
25
- # ========================================================================= #
26
- def self.rnalfold(
27
- i = :use_all_fasta_files_in_the_current_directory
28
- )
29
- require 'bioroebe/colours/sfancy.rb'
30
- require 'bioroebe/colours/sfile.rb'
31
- # ======================================================================= #
32
- # RNALfold will be used (as command).
33
- # ======================================================================= #
34
- use_this_command = 'RNALfold'.dup
35
- case i
36
- when :default,
37
- :use_all_fasta_files_in_the_current_directory
38
- i = Dir['**.fa']
39
- end
40
- if block_given?
41
- yielded = yield
42
- # ===================================================================== #
43
- # Simply append these block-commands in that case:
44
- # ===================================================================== #
45
- use_this_command << " #{yielded}"
46
- end
47
- # ======================================================================= #
48
- # We assume that our input is an Array past this point.
49
- # ======================================================================= #
50
- i.each {|this_file|
51
- e "Working on `#{sfancy(this_file)}` next."
52
- new_filename = this_file.dup
53
- regex_to_use = /-L (\d+)/
54
- use_this_command =~ regex_to_use
55
- new_filename << '.'+$1.to_s.dup
56
- new_filename << '.lfold'
57
- _ = use_this_command+' < '+this_file+' > '+new_filename
58
- esystem _
59
- if File.exist? new_filename
60
- e "A new file has been created at `#{sfile(new_filename)}`."
61
- end
62
- }
63
- end
64
-
65
- end
66
-
67
- if __FILE__ == $PROGRAM_NAME
68
- Bioroebe.rnalfold { '--zscore=-3 -L 200' }
69
- end # bioroebernalfold
@@ -1,116 +0,0 @@
1
- #!/usr/bin/ruby -w
2
- # Encoding: UTF-8
3
- # frozen_string_literal: true
4
- # =========================================================================== #
5
- # The file here will contain code that is related to "find"-ing something,
6
- # typically within another string or object or dataset.
7
- # =========================================================================== #
8
- # require 'bioroebe/toplevel_methods/searching_and_finding.rb'
9
- # Bioroebe.find_substring 'GATATATGCATATACTT', 'ATAT' # => [2, 4, 10]
10
- # =========================================================================== #
11
- module Bioroebe
12
-
13
- # ========================================================================= #
14
- # === Bioroebe.find_substring
15
- #
16
- # This method can be used to find a substring within a larger String.
17
- #
18
- # For example, in the below default values, the substring "ATAT"
19
- # would exist at the positions 2, 4 and 10, if compared to the
20
- # larger parent string "GATATATGCATATACTT".
21
- #
22
- # The following display may help you see this more easily, in
23
- # regards to the substring matches:
24
- #
25
- # GATATATGCATATACTT
26
- # ATATAT ATAT
27
- #
28
- # If you look closely, you will be able to see that "ATAT" can
29
- # be found three times in the string above.
30
- #
31
- # Indices in this context start at position 1, not 0. This is
32
- # mostly done to refer to nucleotides or aminoacids, which
33
- # also typically start at the first letter. Position 0 makes
34
- # no sense for a nucleotide - what would "nucleotide 0" even
35
- # refer to?
36
- #
37
- # The first argument to this method may also be the path to a
38
- # locally existing file, such as "/rosalind_subs.txt". In
39
- # fact this method has been largely motivated by Rosalind
40
- # tasks.
41
- #
42
- # The method will return an Array with the positions of all
43
- # substrings that are found in the full_string variable. See
44
- # the usage example below for how this may be.
45
- #
46
- # Usage example:
47
- #
48
- # Bioroebe.find_substring 'GATATATGCATATACTT', 'ATAT' # => [2, 4, 10]
49
- #
50
- # ========================================================================= #
51
- def self.find_substring(
52
- full_string = 'GATATATGCATATACTT', # ← The full String comes here.
53
- this_substring = :default # ← The substring we are searching for comes here.
54
- )
55
- if full_string.is_a? Array
56
- # ===================================================================== #
57
- # Presently this method will only work on the first member of an Array.
58
- # ===================================================================== #
59
- full_string = full_string.first
60
- end
61
- if full_string and File.file?(full_string) and
62
- this_substring == :default
63
- # ===================================================================== #
64
- # In this case it is ok to read from that file.
65
- # ===================================================================== #
66
- _ = File.read(full_string)
67
- splitted = _.split("\n")
68
- full_string = splitted.first
69
- this_substring = splitted.last
70
- end
71
- case this_substring
72
- # ======================================================================= #
73
- # Use a default value in this case. In reality users should supply
74
- # their own substring when they use this method here.
75
- # ======================================================================= #
76
- when :default,
77
- nil
78
- this_substring = 'ATAT'
79
- else
80
- if this_substring.empty?
81
- this_substring = 'ATAT'
82
- end
83
- end
84
- if full_string.nil? or full_string.empty?
85
- full_string = 'GATATATGCATATACTT' # ← Use the default in this case.
86
- end
87
- result = Array.new.tap { |indexes|
88
- final_index_position = full_string.size - this_substring.size
89
- i = 0
90
- while (i < final_index_position)
91
- index = full_string.to_s.index(this_substring.to_s, i)
92
- break if index.nil?
93
- i = index + 1
94
- indexes << i
95
- end
96
- }
97
- result = nil if result.empty? # ← We will try this here; could also return an empty Array, though.
98
- result # Return our findings here.
99
- end; self.instance_eval { alias find_substring_indices find_substring } # === Bioroebe.find_substring_indices
100
-
101
- end
102
-
103
- if __FILE__ == $PROGRAM_NAME
104
- if File.exist?(ARGV.first)
105
- # ======================================================================= #
106
- # Handle locally existing files first.
107
- # ======================================================================= #
108
- puts Bioroebe.find_substring(ARGV.first).join(' ').strip
109
- else
110
- puts Bioroebe.find_substring(ARGV[0], ARGV[1]).join(' ').strip
111
- end
112
- end # findsubstring TATATA AT
113
- # findsubstring TATATATA AT
114
- # findsubstring GATATATGCATATACTT ATAT
115
- # findsubstring GATATATGCATATACTT ATAT
116
- # findsubstring /rosalind_subs.txt
@@ -1,37 +0,0 @@
1
- #!/usr/bin/ruby -w
2
- # Encoding: UTF-8
3
- # frozen_string_literal: true
4
- # =========================================================================== #
5
- # require 'bioroebe/toplevel_methods/shuffleseq.rb'
6
- # Bioroebe.shuffleseq
7
- # =========================================================================== #
8
- module Bioroebe
9
-
10
- # ========================================================================= #
11
- # === Bioroebe.shuffleseq
12
- #
13
- # This method simulates the Emboss shuffleseq-functionality. It will
14
- # take the input string, such as an assumed DNA sequence, and simply
15
- # re-arrange it as-is.
16
- #
17
- # You can read this here:
18
- #
19
- # https://www.bioinformatics.nl/cgi-bin/emboss/shuffleseq
20
- #
21
- # Usage example:
22
- #
23
- # Bioroebe.shuffleseq 'ATCGATCG' # => "AGTTACGC"
24
- #
25
- # ========================================================================= #
26
- def self.shuffleseq(i = ARGV)
27
- if i.is_a? Array
28
- i = i.join(' ').strip
29
- end
30
- return i.chars.shuffle.join
31
- end; self.instance_eval { alias randomize_the_sequence shuffleseq } # === Bioroebe.randomize_the_sequence
32
-
33
- end
34
-
35
- if __FILE__ == $PROGRAM_NAME
36
- puts Bioroebe.shuffleseq(ARGV)
37
- end # shuffleseq ATCGATCG
@@ -1,53 +0,0 @@
1
- #!/usr/bin/ruby -w
2
- # Encoding: UTF-8
3
- # frozen_string_literal: true
4
- # =========================================================================== #
5
- # require 'bioroebe/toplevel_methods/statistics.rb'
6
- # Bioroebe.show_exon_statistics
7
- # =========================================================================== #
8
- module Bioroebe
9
-
10
- require 'bioroebe/colours/colours.rb'
11
- require 'bioroebe/toplevel_methods/e.rb'
12
- require 'bioroebe/toplevel_methods/esystem.rb'
13
- require 'bioroebe/toplevel_methods/file_and_directory_related_actions.rb'
14
-
15
- # ========================================================================= #
16
- # === Bioroebe.show_exon_statistics
17
- #
18
- # This is mostly "throw-away" code; it will quickly tell us how many
19
- # exons may span over some junction.
20
- #
21
- # It was specifically created to analyze a .gtf file.
22
- #
23
- # Invocation example:
24
- #
25
- # bioroebe --show-exon-statistics-for=/tmp/praktikum/Mouse/chromosome_8/parsed/cdna.8.L100.global.gtf
26
- #
27
- # ========================================================================= #
28
- def self.show_exon_statistics(these_files)
29
- [these_files].flatten.compact.each {|this_file|
30
- if File.exist? this_file
31
- result = `cat #{this_file} | awk '{print $12}' | sort | uniq -c | sort -k1n | awk '{print $1}' | sort | uniq -c | less`
32
- e gold(' n exons')
33
- splitted = result.split("\n")
34
- # =================================================================== #
35
- # splitted may look like this:
36
- #
37
- # [" 89839 1", " 26031 2", " 1136 3", " 24 4"]
38
- #
39
- # =================================================================== #
40
- splitted.each {|line|
41
- e line.sub(/( \d+)$/, gold('\1'))
42
- }
43
- else
44
- no_file_exists_at(this_file)
45
- end
46
- }
47
- end
48
-
49
- end
50
-
51
- if __FILE__ == $PROGRAM_NAME
52
- Bioroebe.show_exon_statistics(ARGV)
53
- end # showexonstatistics /tmp/praktikum/Mouse/chromosome_8/parsed/cdna.8.L100.global.gtf