bioroebe 0.12.24 → 0.13.31

Sign up to get free protection for your applications and to get access to all the features.
Files changed (503) hide show
  1. checksums.yaml +4 -4
  2. data/LICENSE.md +7 -8
  3. data/README.md +566 -354
  4. data/bin/all_positions_of_this_nucleotide +1 -1
  5. data/bin/aminoacid_frequencies +1 -1
  6. data/bin/automatically_rename_this_fasta_file +1 -1
  7. data/bin/base_composition +1 -1
  8. data/bin/batch_create_windows_executables +1 -1
  9. data/bin/bioroebe +12 -1
  10. data/bin/bioroebe_cat +7 -0
  11. data/bin/calculate_exponential_growth +7 -0
  12. data/bin/calculate_n50_value +1 -1
  13. data/bin/calculate_the_frequencies_of_this_species +7 -0
  14. data/bin/chunked_display +1 -1
  15. data/bin/codon_frequency +1 -1
  16. data/bin/codon_to_aminoacid +1 -1
  17. data/bin/colourize_this_fasta_sequence +1 -1
  18. data/bin/complementary_dna_strand +1 -1
  19. data/bin/complementary_rna_strand +1 -1
  20. data/bin/consensus_sequence +1 -1
  21. data/bin/dna_to_rna +1 -1
  22. data/bin/downcase_chunked_display +1 -1
  23. data/bin/download_this_pdb +1 -1
  24. data/bin/fasta_index +1 -1
  25. data/bin/fetch_data_from_uniprot +1 -1
  26. data/bin/filter_away_invalid_nucleotides +1 -1
  27. data/bin/find_substring +1 -1
  28. data/bin/input_as_dna +1 -1
  29. data/bin/is_palindrome +1 -1
  30. data/bin/leading_five_prime +1 -1
  31. data/bin/longest_ORF +1 -1
  32. data/bin/longest_substring +1 -1
  33. data/bin/open_reading_frames +1 -1
  34. data/bin/partner_nucleotide +1 -1
  35. data/bin/plain_palindrome +1 -1
  36. data/bin/random_dna_sequence +1 -1
  37. data/bin/random_sequence +1 -1
  38. data/bin/raw_hamming_distance +1 -1
  39. data/bin/return_longest_substring_via_LCS_algorithm +1 -1
  40. data/bin/reverse_sequence +1 -1
  41. data/bin/short_aminoacid_letter_from_long_aminoacid_name +1 -1
  42. data/bin/show_atomic_composition +1 -1
  43. data/bin/show_fasta_header +1 -1
  44. data/bin/show_nucleotide_sequence +1 -1
  45. data/bin/show_this_dna_sequence +1 -1
  46. data/bin/show_time_now +7 -0
  47. data/bin/sort_aminoacid_based_on_its_hydrophobicity +1 -1
  48. data/bin/strict_filter_away_invalid_aminoacids +1 -1
  49. data/{lib/bioroebe/base/reset.rb → bin/three_delimiter} +9 -6
  50. data/bin/three_to_one +1 -1
  51. data/bin/to_rna +1 -1
  52. data/bin/trailing_three_prime +1 -1
  53. data/bin/upcase_this_aminoacid_sequence_and_remove_numbers +1 -1
  54. data/bioroebe.gemspec +6 -7
  55. data/doc/README.gen +534 -322
  56. data/doc/blosum/blosum.md +4 -0
  57. data/doc/compatibility/BIO_PHP.md +20 -18
  58. data/doc/compatibility/README.md +2 -3
  59. data/doc/compatibility/emboss.md +5 -3
  60. data/doc/{extensive_usage_example.md → extensive_usage_example/extensive_usage_example.md} +4 -2
  61. data/doc/{instructions_for_the_taxonomy_subproject.md → instructions_for_the_taxonomy_subproject/instructions_for_the_taxonomy_subproject.md} +36 -33
  62. data/doc/{legacy_paths.md → legacy_paths/legacy_paths.md} +3 -3
  63. data/doc/statistics/statistics.md +12 -10
  64. data/doc/todo/bioroebe_GUI_todo.md +6 -1
  65. data/doc/todo/bioroebe_java_todo.md +3 -2
  66. data/doc/todo/bioroebe_todo.md +328 -310
  67. data/doc/{using_biomart.md → using_biomart/using_biomart.md} +7 -3
  68. data/lib/bioroebe/abstract/features.rb +0 -0
  69. data/lib/bioroebe/aminoacids/aminoacid_substitution.rb +1 -1
  70. data/lib/bioroebe/aminoacids/aminoacids_mass_table.rb +3 -1
  71. data/lib/bioroebe/aminoacids/codon_percentage.rb +18 -10
  72. data/lib/bioroebe/aminoacids/create_random_aminoacids.rb +5 -2
  73. data/lib/bioroebe/aminoacids/deduce_aminoacid_sequence.rb +90 -64
  74. data/lib/bioroebe/aminoacids/display_aminoacid_table.rb +1 -3
  75. data/lib/bioroebe/aminoacids/show_hydrophobicity.rb +2 -2
  76. data/lib/bioroebe/annotations/create_annotation_format.rb +2 -2
  77. data/lib/bioroebe/base/base.rb +101 -6
  78. data/lib/bioroebe/base/base_module/base_module.rb +9 -1
  79. data/lib/bioroebe/base/colours.rb +3 -0
  80. data/lib/bioroebe/base/colours_for_base/colours_for_base.rb +80 -44
  81. data/lib/bioroebe/base/commandline_application/README.md +1 -1
  82. data/lib/bioroebe/base/commandline_application/commandline_application.rb +661 -22
  83. data/lib/bioroebe/base/commandline_application/commandline_arguments.rb +2 -1
  84. data/lib/bioroebe/base/infer_the_namespace_module/infer_the_namespace_module.rb +37 -0
  85. data/lib/bioroebe/base/internal_hash_module/internal_hash_module.rb +1 -6
  86. data/lib/bioroebe/base/prototype/prototype.rb +155 -14
  87. data/lib/bioroebe/biomart/attribute.rb +1 -1
  88. data/lib/bioroebe/biomart/biomart.rb +8 -9
  89. data/lib/bioroebe/biomart/server.rb +1 -1
  90. data/lib/bioroebe/blosum/blosum.rb +2 -2
  91. data/lib/bioroebe/calculate/calculate_blosum_score.rb +5 -3
  92. data/lib/bioroebe/calculate/calculate_gc_content.rb +1 -1
  93. data/lib/bioroebe/calculate/calculate_levensthein_distance.rb +5 -3
  94. data/lib/bioroebe/calculate/calculate_melting_temperature.rb +2 -10
  95. data/lib/bioroebe/calculate/calculate_melting_temperature_for_more_than_thirteen_nucleotides.rb +6 -15
  96. data/lib/bioroebe/calculate/calculate_the_position_specific_scoring_matrix.rb +4 -2
  97. data/lib/bioroebe/cell/cell.rb +3 -2
  98. data/lib/bioroebe/cell/specialized_cells/B_cell.rb +60 -0
  99. data/lib/bioroebe/cell/specialized_cells/Macrophage.rb +60 -0
  100. data/lib/bioroebe/cell/specialized_cells/README.md +5 -0
  101. data/lib/bioroebe/cell/specialized_cells/T_cell.rb +60 -0
  102. data/lib/bioroebe/cleave_and_digest/cleave.rb +3 -1
  103. data/lib/bioroebe/cleave_and_digest/digestion.rb +1 -1
  104. data/lib/bioroebe/codon_tables/frequencies/10090_Mus_musculus.yml +93 -0
  105. data/lib/bioroebe/codon_tables/frequencies/107243_Thlaspi_caerulescens.yml +72 -0
  106. data/lib/bioroebe/codon_tables/frequencies/parse_frequency_table.rb +2 -2
  107. data/lib/bioroebe/codons/codon_table.rb +10 -2
  108. data/lib/bioroebe/codons/codons.rb +3 -3
  109. data/lib/bioroebe/codons/convert_this_codon_to_that_aminoacid.rb +18 -15
  110. data/lib/bioroebe/codons/determine_optimal_codons.rb +1 -1
  111. data/lib/bioroebe/codons/possible_codons_for_this_aminoacid.rb +4 -2
  112. data/lib/bioroebe/codons/show_codon_tables.rb +1 -1
  113. data/lib/bioroebe/codons/show_codon_usage.rb +1 -2
  114. data/lib/bioroebe/codons/show_this_codon_table.rb +2 -2
  115. data/lib/bioroebe/codons/start_codons.rb +7 -3
  116. data/lib/bioroebe/colours/colour_schemes/README.md +1 -1
  117. data/lib/bioroebe/colours/colour_schemes/array_available_colour_schemes.rb +3 -3
  118. data/lib/bioroebe/colours/colour_schemes/colour_scheme.rb +3 -3
  119. data/lib/bioroebe/colours/colour_schemes/colour_scheme_demo.rb +4 -3
  120. data/lib/bioroebe/colours/colour_schemes/helix.rb +3 -1
  121. data/lib/bioroebe/colours/colour_schemes/hydropathy.rb +3 -1
  122. data/lib/bioroebe/colours/colour_schemes/score.rb +13 -2
  123. data/lib/bioroebe/colours/colour_schemes/strand.rb +3 -1
  124. data/lib/bioroebe/colours/colour_schemes/turn.rb +3 -1
  125. data/lib/bioroebe/colours/colour_schemes/zappo.rb +1 -1
  126. data/lib/bioroebe/{toplevel_methods/colourize_related_methods.rb → colours/colourize_related_code.rb} +1 -3
  127. data/lib/bioroebe/colours/colourize_sequence.rb +3 -1
  128. data/lib/bioroebe/colours/colours.rb +172 -15
  129. data/lib/bioroebe/configuration/configuration.rb +1 -1
  130. data/lib/bioroebe/constants/GUIs.rb +2 -2
  131. data/lib/bioroebe/constants/constants.rb +1349 -0
  132. data/lib/bioroebe/conversions/convert_aminoacid_to_dna.rb +8 -13
  133. data/lib/bioroebe/conversions/dna_to_aminoacid_sequence.rb +9 -3
  134. data/lib/bioroebe/count/count_amount_of_aminoacids.rb +11 -10
  135. data/lib/bioroebe/count/count_amount_of_nucleotides.rb +1 -1
  136. data/lib/bioroebe/count/count_at.rb +2 -1
  137. data/lib/bioroebe/databases/download_taxonomy_database.rb +1 -1
  138. data/lib/bioroebe/dotplots/advanced_dotplot.rb +2 -2
  139. data/lib/bioroebe/electron_microscopy/coordinate_analyzer.rb +2 -2
  140. data/lib/bioroebe/electron_microscopy/fix_pos_file.rb +2 -2
  141. data/lib/bioroebe/electron_microscopy/flipy.rb +2 -2
  142. data/lib/bioroebe/electron_microscopy/generate_em2em_file.rb +3 -11
  143. data/lib/bioroebe/electron_microscopy/parse_coordinates.rb +6 -6
  144. data/lib/bioroebe/electron_microscopy/read_file_xmd.rb +6 -6
  145. data/lib/bioroebe/electron_microscopy/simple_star_file_generator.rb +2 -2
  146. data/lib/bioroebe/enzymes/has_this_restriction_enzyme.rb +1 -1
  147. data/lib/bioroebe/enzymes/restriction_enzyme.rb +1 -1
  148. data/lib/bioroebe/enzymes/restriction_enzymes/statistics.rb +4 -3
  149. data/lib/bioroebe/enzymes/restriction_enzymes_file.rb +1 -1
  150. data/lib/bioroebe/enzymes/return_sequence_that_is_cut_via_restriction_enzyme.rb +4 -3
  151. data/lib/bioroebe/enzymes/show_restriction_enzymes.rb +3 -3
  152. data/lib/bioroebe/ext/main.cpp +0 -1
  153. data/lib/bioroebe/fasta_and_fastq/autocorrect_the_name_of_this_fasta_file.rb +3 -3
  154. data/lib/bioroebe/fasta_and_fastq/compact_fasta_file/compact_fasta_file.rb +1 -1
  155. data/lib/bioroebe/fasta_and_fastq/display_how_many_fasta_entries_are_in_this_directory.rb +1 -1
  156. data/lib/bioroebe/fasta_and_fastq/download_fasta.rb +8 -14
  157. data/lib/bioroebe/fasta_and_fastq/fasta_defline/fasta_defline.rb +1 -1
  158. data/lib/bioroebe/fasta_and_fastq/fasta_to_yaml/fasta_to_yaml.rb +1 -1
  159. data/lib/bioroebe/fasta_and_fastq/fastq_format_explainer.rb +1 -1
  160. data/lib/bioroebe/fasta_and_fastq/length_modifier/length_modifier.rb +1 -1
  161. data/lib/bioroebe/fasta_and_fastq/parse_fasta/parse_fasta.rb +37 -11
  162. data/lib/bioroebe/fasta_and_fastq/parse_fastq/parse_fastq.rb +2 -2
  163. data/lib/bioroebe/fasta_and_fastq/return_fasta_subsection_of_this_file.rb +1 -1
  164. data/lib/bioroebe/fasta_and_fastq/show_fasta_headers.rb +5 -13
  165. data/lib/bioroebe/fasta_and_fastq/show_fasta_statistics.rb +1 -1
  166. data/lib/bioroebe/fasta_and_fastq/simplify_fasta_header/simplify_fasta_header.rb +1 -1
  167. data/lib/bioroebe/fasta_and_fastq/split_this_fasta_file_into_chromosomes/reset.rb +3 -6
  168. data/lib/bioroebe/fasta_and_fastq/split_this_fasta_file_into_chromosomes/split_this_fasta_file_into_chromosomes.rb +3 -3
  169. data/lib/bioroebe/genbank/genbank_flat_file_format_generator.rb +20 -11
  170. data/lib/bioroebe/genome/genome.rb +1 -1
  171. data/lib/bioroebe/genomes/genome_pattern.rb +17 -16
  172. data/lib/bioroebe/genomes/genome_retriever.rb +4 -2
  173. data/lib/bioroebe/gui/experimental/snapgene/snapgene.rb +10 -13
  174. data/lib/bioroebe/gui/universal_widgets/alignment/alignment.rb +557 -0
  175. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/aminoacid_composition/aminoacid_composition.rb +498 -198
  176. data/lib/bioroebe/gui/universal_widgets/anti_sense_strand/anti_sense_strand.rb +665 -0
  177. data/lib/bioroebe/gui/universal_widgets/blosum_matrix_viewer/blosum_matrix_viewer.rb +329 -0
  178. data/lib/bioroebe/gui/universal_widgets/calculate_cell_numbers_of_bacteria/calculate_cell_numbers_of_bacteria.rb +423 -0
  179. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/controller/controller.rb +170 -118
  180. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/dna_to_aminoacid_widget/dna_to_aminoacid_widget.rb +277 -215
  181. data/lib/bioroebe/gui/{shared_code/dna_to_reverse_complement_widget/dna_to_reverse_complement_widget_module.rb → universal_widgets/dna_to_reverse_complement_widget/dna_to_reverse_complement_widget.rb} +297 -107
  182. data/lib/bioroebe/gui/universal_widgets/fasta_table_widget/fasta_table_widget.rb +643 -0
  183. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/format_converter/format_converter.rb +236 -164
  184. data/lib/bioroebe/gui/universal_widgets/gene/gene.rb +278 -0
  185. data/lib/bioroebe/gui/universal_widgets/hamming_distance/hamming_distance.rb +646 -0
  186. data/lib/bioroebe/gui/{shared_code/levensthein_distance/levensthein_distance_module.rb → universal_widgets/levensthein_distance/levensthein_distance.rb} +313 -88
  187. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/nucleotide_analyser/nucleotide_analyser.rb +281 -189
  188. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/parse_pdb_file/parse_pdb_file.rb +265 -149
  189. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/primer_design_widget/primer_design_widget.rb +337 -263
  190. data/lib/bioroebe/gui/universal_widgets/protein_to_DNA/protein_to_DNA.rb +408 -0
  191. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/random_sequence/random_sequence.rb +245 -187
  192. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/restriction_enzymes/restriction_enzymes.rb +207 -137
  193. data/lib/bioroebe/gui/universal_widgets/shell/shell.rb +288 -0
  194. data/lib/bioroebe/gui/{gtk3/show_codon_table/misc.rb → universal_widgets/show_codon_table/show_codon_table.rb} +290 -110
  195. data/lib/bioroebe/gui/{shared_code/show_codon_usage/show_codon_usage_module.rb → universal_widgets/show_codon_usage/show_codon_usage.rb} +228 -47
  196. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/sizeseq/sizeseq.rb +151 -69
  197. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/three_to_one/three_to_one.rb +190 -127
  198. data/lib/bioroebe/gui/{gtk3 → universal_widgets}/www_finder/www_finder.rb +211 -152
  199. data/lib/bioroebe/images/images.html +953 -1170
  200. data/lib/bioroebe/images/misc/README.md +6 -0
  201. data/lib/bioroebe/images/misc/activation.avif +0 -0
  202. data/lib/bioroebe/images/misc/inhibition.avif +0 -0
  203. data/lib/bioroebe/images/misc/small_virus_logo.avif +0 -0
  204. data/lib/bioroebe/{constants/base_directory.rb → log_directory/log_directory.rb} +79 -59
  205. data/lib/bioroebe/matplotlib/matplotlib_generator.rb +1 -1
  206. data/lib/bioroebe/misc/quiz/three_letter_to_aminoacid.rb +1 -1
  207. data/lib/bioroebe/misc/ruler.rb +5 -5
  208. data/lib/bioroebe/misc/useful_formulas.rb +3 -3
  209. data/lib/bioroebe/ncbi/efetch.rb +1 -2
  210. data/lib/bioroebe/ngs/phred_quality_score_table.rb +3 -3
  211. data/lib/bioroebe/nucleotides/complementary_dna_strand.rb +3 -6
  212. data/lib/bioroebe/nucleotides/molecular_weight_of_nucleotides.rb +3 -3
  213. data/lib/bioroebe/nucleotides/most_likely_nucleotide_sequence_for_this_aminoacid_sequence.rb +6 -10
  214. data/lib/bioroebe/nucleotides/{show_nucleotide_sequence.rb → show_nucleotide_sequence/show_nucleotide_sequence.rb} +377 -255
  215. data/lib/bioroebe/palindromes/palindrome_2D_structure.rb +1 -1
  216. data/lib/bioroebe/palindromes/palindrome_finder.rb +1 -1
  217. data/lib/bioroebe/palindromes/palindrome_generator.rb +2 -10
  218. data/lib/bioroebe/parsers/biolang_parser.rb +1 -1
  219. data/lib/bioroebe/parsers/blosum_parser.rb +14 -19
  220. data/lib/bioroebe/parsers/genbank_parser.rb +2 -6
  221. data/lib/bioroebe/parsers/gff.rb +9 -9
  222. data/lib/bioroebe/parsers/parse_embl.rb +2 -6
  223. data/lib/bioroebe/parsers/stride_parser.rb +4 -12
  224. data/lib/bioroebe/patterns/analyse_glycosylation_pattern.rb +2 -2
  225. data/lib/bioroebe/patterns/is_this_sequence_a_EGF2_pattern.rb +6 -3
  226. data/lib/bioroebe/patterns/profile_pattern.rb +2 -2
  227. data/lib/bioroebe/patterns/rgg_scanner.rb +4 -2
  228. data/lib/bioroebe/{protein_structure → pdb_and_protein_structure}/alpha_helix.rb +2 -2
  229. data/lib/bioroebe/{pdb → pdb_and_protein_structure}/download_this_pdb.rb +2 -3
  230. data/lib/bioroebe/{pdb → pdb_and_protein_structure}/fetch_fasta_sequence_from_pdb.rb +4 -4
  231. data/lib/bioroebe/{protein_structure → pdb_and_protein_structure}/helical_wheel.rb +2 -2
  232. data/lib/bioroebe/{pdb → pdb_and_protein_structure}/parse_mmCIF_file.rb +1 -1
  233. data/lib/bioroebe/{pdb → pdb_and_protein_structure}/parse_pdb_file.rb +3 -3
  234. data/lib/bioroebe/{pdb → pdb_and_protein_structure}/report_secondary_structures_from_this_pdb_file.rb +3 -3
  235. data/lib/bioroebe/project/project.rb +3 -1
  236. data/lib/bioroebe/raw_sequence/README.md +8 -8
  237. data/lib/bioroebe/raw_sequence/raw_sequence.rb +11 -2
  238. data/lib/bioroebe/regexes/regexes.rb +1 -2
  239. data/lib/bioroebe/requires/commandline_application.rb +3 -1
  240. data/lib/bioroebe/requires/require_all_pdb_files.rb +1 -1
  241. data/lib/bioroebe/requires/require_all_taxonomy_files.rb +1 -1
  242. data/lib/bioroebe/requires/require_all_utility_scripts_files.rb +10 -0
  243. data/lib/bioroebe/requires/require_colours.rb +1 -1
  244. data/lib/bioroebe/requires/require_the_bioroebe_project.rb +5 -7
  245. data/lib/bioroebe/requires/require_the_bioroebe_sinatra_components.rb +1 -1
  246. data/lib/bioroebe/requires/require_the_constants.rb +2 -14
  247. data/lib/bioroebe/requires/require_yaml.rb +7 -5
  248. data/lib/bioroebe/sequence/alignment.rb +1 -1
  249. data/lib/bioroebe/sequence/dna.rb +4 -2
  250. data/lib/bioroebe/sequence/nucleotide_module/nucleotide_module.rb +22 -8
  251. data/lib/bioroebe/sequence/protein.rb +2 -2
  252. data/lib/bioroebe/sequence/reverse_complement.rb +3 -3
  253. data/lib/bioroebe/sequence/rna.rb +9 -8
  254. data/lib/bioroebe/sequence/sequence.rb +3 -3
  255. data/lib/bioroebe/shell/configuration/additionally_set_xorg_buffer.yml +0 -0
  256. data/lib/bioroebe/shell/configuration/may_we_show_the_startup_information.yml +0 -0
  257. data/lib/bioroebe/shell/configuration/upcase_nucleotides.yml +0 -0
  258. data/lib/bioroebe/shell/configuration/use_silent_startup.yml +1 -1
  259. data/lib/bioroebe/shell/help/class.rb +68 -19
  260. data/lib/bioroebe/shell/menu.rb +5244 -5322
  261. data/lib/bioroebe/shell/{readline/readline.rb → readline.rb} +1 -3
  262. data/lib/bioroebe/shell/shell.rb +11240 -453
  263. data/lib/bioroebe/siRNA/siRNA.rb +3 -3
  264. data/lib/bioroebe/{gui/shared_code/blosum_matrix_viewer/blosum_matrix_viewer_module.rb → sinatra/sinatra_interface.rb} +28 -19
  265. data/lib/bioroebe/{www/sinatra/sinatra.rb → sinatra/sinatra_wrapper.rb} +731 -754
  266. data/lib/bioroebe/string_matching/find_longest_substring.rb +2 -10
  267. data/lib/bioroebe/string_matching/find_longest_substring_via_LCS_algorithm.rb +4 -14
  268. data/lib/bioroebe/string_matching/hamming_distance.rb +11 -10
  269. data/lib/bioroebe/string_matching/levensthein.rb +5 -17
  270. data/lib/bioroebe/string_matching/simple_string_comparer.rb +48 -4
  271. data/lib/bioroebe/string_matching/smith_waterman.rb +11 -6
  272. data/lib/bioroebe/svg/glyph.rb +4 -1
  273. data/lib/bioroebe/svg/mini_feature.rb +1 -1
  274. data/lib/bioroebe/svg/page.rb +18 -7
  275. data/lib/bioroebe/svg/svgee.rb +22 -13
  276. data/lib/bioroebe/svg/track.rb +20 -4
  277. data/lib/bioroebe/taxonomy/chart.rb +2 -2
  278. data/lib/bioroebe/taxonomy/class_methods.rb +5 -6
  279. data/lib/bioroebe/taxonomy/constants.rb +1 -1
  280. data/lib/bioroebe/taxonomy/info/info.rb +1 -1
  281. data/lib/bioroebe/taxonomy/info/is_dna.rb +1 -1
  282. data/lib/bioroebe/taxonomy/interactive.rb +1 -2
  283. data/lib/bioroebe/taxonomy/menu.rb +1 -1
  284. data/lib/bioroebe/taxonomy/node.rb +1 -1
  285. data/lib/bioroebe/taxonomy/parse_fasta.rb +4 -2
  286. data/lib/bioroebe/taxonomy/shared.rb +5 -4
  287. data/lib/bioroebe/taxonomy/taxonomy.rb +2 -4
  288. data/lib/bioroebe/toplevel_methods/fasta_and_fastq.rb +3 -45
  289. data/lib/bioroebe/toplevel_methods/{is_on_roebe.rb → roebe.rb} +1 -11
  290. data/lib/bioroebe/toplevel_methods/taxonomy.rb +6 -12
  291. data/lib/bioroebe/toplevel_methods/toplevel_methods.rb +5568 -0
  292. data/lib/bioroebe/utility_scripts/align_open_reading_frames.rb +4 -3
  293. data/lib/bioroebe/utility_scripts/analyse_local_dataset.rb +2 -2
  294. data/lib/bioroebe/utility_scripts/check_for_mismatches/check_for_mismatches.rb +16 -9
  295. data/lib/bioroebe/utility_scripts/compacter/compacter.rb +4 -2
  296. data/lib/bioroebe/utility_scripts/compare_these_two_sequences_via_blosum.rb +119 -0
  297. data/lib/bioroebe/utility_scripts/compseq/compseq.rb +11 -9
  298. data/lib/bioroebe/utility_scripts/{consensus_sequence.rb → consensus_sequence/consensus_sequence.rb} +13 -4
  299. data/lib/bioroebe/utility_scripts/{create_batch_entrez_file.rb → create_batch_entrez_file/create_batch_entrez_file.rb} +5 -5
  300. data/lib/bioroebe/utility_scripts/{determine_antigenic_areas.rb → determine_antigenic_areas/determine_antigenic_areas.rb} +5 -5
  301. data/lib/bioroebe/utility_scripts/{determine_missing_nucleotides_percentage.rb → determine_missing_nucleotides_percentage/determine_missing_nucleotides_percentage.rb} +16 -15
  302. data/lib/bioroebe/utility_scripts/display_open_reading_frames/display_open_reading_frames.rb +7 -7
  303. data/lib/bioroebe/utility_scripts/display_open_reading_frames/misc.rb +1 -1
  304. data/lib/bioroebe/utility_scripts/display_open_reading_frames/report.rb +2 -0
  305. data/lib/bioroebe/utility_scripts/{dot_alignment.rb → dot_alignment/dot_alignment.rb} +3 -3
  306. data/lib/bioroebe/utility_scripts/{download_files_from_rebase.rb → download_files_from_rebase/download_files_from_rebase.rb} +5 -5
  307. data/lib/bioroebe/utility_scripts/fetch_data_from_uniprot/fetch_data_from_uniprot.rb +269 -0
  308. data/lib/bioroebe/utility_scripts/find_gene.rb +4 -2
  309. data/lib/bioroebe/utility_scripts/{mirror_repeat.rb → mirror_repeat/mirror_repeat.rb} +5 -5
  310. data/lib/bioroebe/utility_scripts/move_file_to_its_correct_location.rb +3 -3
  311. data/lib/bioroebe/utility_scripts/{parse_taxonomy.rb → parse_taxonomy/parse_taxonomy.rb} +15 -6
  312. data/lib/bioroebe/utility_scripts/{pathways.rb → pathways/pathways.rb} +4 -3
  313. data/lib/bioroebe/utility_scripts/{permutations.rb → permutations/permutations.rb} +3 -3
  314. data/lib/bioroebe/utility_scripts/punnet/punnet.rb +4 -2
  315. data/lib/bioroebe/utility_scripts/{show_this_dna_sequence.rb → show_this_dna_sequence/show_this_dna_sequence.rb} +1 -1
  316. data/lib/bioroebe/utility_scripts/showorf/showorf.rb +406 -10
  317. data/lib/bioroebe/version/version.rb +2 -2
  318. data/lib/bioroebe/viennarna/rnafold_wrapper.rb +5 -13
  319. data/lib/bioroebe/virus/individual_viruses/README.md +15 -0
  320. data/lib/bioroebe/virus/individual_viruses/tobacco_mosaic_virus.rb +40 -0
  321. data/lib/bioroebe/virus/virus.rb +76 -0
  322. data/lib/bioroebe/www/bioroebe.cgi +4 -3
  323. data/lib/bioroebe/www/embeddable_interface.rb +85 -49
  324. data/lib/bioroebe/yaml/agarose/agarose_concentrations.yml +6 -6
  325. data/lib/bioroebe/yaml/antisense/antisense.yml +2 -0
  326. data/lib/bioroebe/yaml/blosum/blosum50.yml +6 -0
  327. data/lib/bioroebe/yaml/blosum/blosum90.yml +2 -1
  328. data/lib/bioroebe/yaml/chromosomes/chromosome_numbers.yml +2 -2
  329. data/lib/bioroebe/yaml/configuration/temp_dir.yml +1 -1
  330. data/lib/bioroebe/yaml/consensus_sequences/consensus_sequences.yml +1 -0
  331. data/lib/bioroebe/yaml/enzymes/enzyme_classes.yml +7 -6
  332. data/lib/bioroebe/yaml/humans/human_chromosomes.yml +3 -3
  333. data/lib/bioroebe/yaml/mRNA/mRNA.yml +1 -5
  334. data/lib/bioroebe/yaml/nucleotides/abbreviations_for_nucleotides.yml +1 -0
  335. data/lib/bioroebe/yaml/nucleotides/nucleotide_density.yml +2 -1
  336. data/lib/bioroebe/yaml/promoters/35S.yml +3 -1
  337. data/lib/bioroebe/yaml/proteases/proteases.yml +3 -1
  338. data/lib/bioroebe/yaml/proteins/ubiquitin.yml +4 -1
  339. data/lib/bioroebe/yaml/restriction_enzymes/restriction_enzymes.yml +7 -7
  340. data/spec/testing_toplevel_method_editor.rb +1 -1
  341. data/spec/testing_toplevel_method_verbose.rb +1 -1
  342. data/test/testing_dna_to_rna_conversion.rb +1 -1
  343. metadata +127 -235
  344. data/doc/blosum.md +0 -5
  345. data/lib/bioroebe/base/commandline_application/aminoacids.rb +0 -33
  346. data/lib/bioroebe/base/commandline_application/directory.rb +0 -33
  347. data/lib/bioroebe/base/commandline_application/extract.rb +0 -22
  348. data/lib/bioroebe/base/commandline_application/misc.rb +0 -502
  349. data/lib/bioroebe/base/commandline_application/opn.rb +0 -47
  350. data/lib/bioroebe/base/commandline_application/reset.rb +0 -42
  351. data/lib/bioroebe/base/commandline_application/warnings.rb +0 -36
  352. data/lib/bioroebe/base/commandline_application/write_what_into.rb +0 -29
  353. data/lib/bioroebe/base/initialize.rb +0 -18
  354. data/lib/bioroebe/base/misc.rb +0 -129
  355. data/lib/bioroebe/base/namespace.rb +0 -16
  356. data/lib/bioroebe/base/prototype/e_and_ee.rb +0 -24
  357. data/lib/bioroebe/base/prototype/misc.rb +0 -114
  358. data/lib/bioroebe/base/prototype/mkdir.rb +0 -20
  359. data/lib/bioroebe/base/prototype/reset.rb +0 -36
  360. data/lib/bioroebe/colours/misc_colours.rb +0 -80
  361. data/lib/bioroebe/colours/rev.rb +0 -44
  362. data/lib/bioroebe/colours/sdir.rb +0 -21
  363. data/lib/bioroebe/colours/sfancy.rb +0 -21
  364. data/lib/bioroebe/colours/sfile.rb +0 -21
  365. data/lib/bioroebe/colours/simp.rb +0 -21
  366. data/lib/bioroebe/colours/swarn.rb +0 -29
  367. data/lib/bioroebe/constants/aminoacids_and_proteins.rb +0 -147
  368. data/lib/bioroebe/constants/carriage_return.rb +0 -14
  369. data/lib/bioroebe/constants/codon_tables.rb +0 -77
  370. data/lib/bioroebe/constants/database_constants.rb +0 -107
  371. data/lib/bioroebe/constants/files_and_directories.rb +0 -606
  372. data/lib/bioroebe/constants/misc.rb +0 -209
  373. data/lib/bioroebe/constants/newline.rb +0 -14
  374. data/lib/bioroebe/constants/nucleotides.rb +0 -121
  375. data/lib/bioroebe/constants/regex.rb +0 -28
  376. data/lib/bioroebe/constants/roebe.rb +0 -38
  377. data/lib/bioroebe/constants/row_terminator.rb +0 -16
  378. data/lib/bioroebe/constants/tabulator.rb +0 -14
  379. data/lib/bioroebe/constants/unicode.rb +0 -12
  380. data/lib/bioroebe/constants/urls.rb +0 -50
  381. data/lib/bioroebe/gui/gtk +0 -1
  382. data/lib/bioroebe/gui/gtk3/README.md +0 -2
  383. data/lib/bioroebe/gui/gtk3/alignment/alignment.rb +0 -306
  384. data/lib/bioroebe/gui/gtk3/anti_sense_strand/anti_sense_strand.rb +0 -29
  385. data/lib/bioroebe/gui/gtk3/blosum_matrix_viewer/blosum_matrix_viewer.rb +0 -195
  386. data/lib/bioroebe/gui/gtk3/calculate_cell_numbers_of_bacteria/calculate_cell_numbers_of_bacteria.rb +0 -105
  387. data/lib/bioroebe/gui/gtk3/dna_to_reverse_complement_widget/dna_to_reverse_complement_widget.rb +0 -188
  388. data/lib/bioroebe/gui/gtk3/fasta_table_widget/fasta_table_widget.rb +0 -322
  389. data/lib/bioroebe/gui/gtk3/gene/gene.rb +0 -181
  390. data/lib/bioroebe/gui/gtk3/hamming_distance/hamming_distance.rb +0 -383
  391. data/lib/bioroebe/gui/gtk3/levensthein_distance/levensthein_distance.rb +0 -174
  392. data/lib/bioroebe/gui/gtk3/protein_to_DNA/protein_to_DNA.rb +0 -181
  393. data/lib/bioroebe/gui/gtk3/show_codon_table/show_codon_table.rb +0 -101
  394. data/lib/bioroebe/gui/gtk3/show_codon_usage/show_codon_usage.rb +0 -145
  395. data/lib/bioroebe/gui/gtk3/three_to_one/title.rb +0 -23
  396. data/lib/bioroebe/gui/jruby/alignment/alignment.rb +0 -165
  397. data/lib/bioroebe/gui/jruby/aminoacid_composition/aminoacid_composition.rb +0 -166
  398. data/lib/bioroebe/gui/jruby/blosum_matrix_viewer/blosum_matrix_viewer.rb +0 -82
  399. data/lib/bioroebe/gui/libui/README.md +0 -4
  400. data/lib/bioroebe/gui/libui/alignment/alignment.rb +0 -116
  401. data/lib/bioroebe/gui/libui/blosum_matrix_viewer/blosum_matrix_viewer.rb +0 -112
  402. data/lib/bioroebe/gui/libui/calculate_cell_numbers_of_bacteria/calculate_cell_numbers_of_bacteria.rb +0 -60
  403. data/lib/bioroebe/gui/libui/controller/controller.rb +0 -116
  404. data/lib/bioroebe/gui/libui/dna_to_aminoacid_widget/dna_to_aminoacid_widget.rb +0 -161
  405. data/lib/bioroebe/gui/libui/dna_to_reverse_complement_widget/dna_to_reverse_complement_widget.rb +0 -76
  406. data/lib/bioroebe/gui/libui/hamming_distance/hamming_distance.rb +0 -135
  407. data/lib/bioroebe/gui/libui/levensthein_distance/levensthein_distance.rb +0 -118
  408. data/lib/bioroebe/gui/libui/protein_to_DNA/protein_to_DNA.rb +0 -115
  409. data/lib/bioroebe/gui/libui/random_sequence/random_sequence.rb +0 -190
  410. data/lib/bioroebe/gui/libui/show_codon_table/show_codon_table.rb +0 -134
  411. data/lib/bioroebe/gui/libui/show_codon_usage/show_codon_usage.rb +0 -89
  412. data/lib/bioroebe/gui/libui/three_to_one/three_to_one.rb +0 -113
  413. data/lib/bioroebe/gui/shared_code/alignment/alignment_module.rb +0 -102
  414. data/lib/bioroebe/gui/shared_code/aminoacid_composition/aminoacid_composition_module.rb +0 -94
  415. data/lib/bioroebe/gui/shared_code/calculate_cell_numbers_of_bacteria/calculate_cell_numbers_of_bacteria_module.rb +0 -216
  416. data/lib/bioroebe/gui/shared_code/protein_to_DNA/protein_to_DNA_module.rb +0 -192
  417. data/lib/bioroebe/gui/shared_code/show_codon_table/show_codon_table_module.rb +0 -72
  418. data/lib/bioroebe/gui/tk/aminoacid_composition/aminoacid_composition.rb +0 -206
  419. data/lib/bioroebe/gui/tk/blosum_matrix_viewer/blosum_matrix_viewer.rb +0 -140
  420. data/lib/bioroebe/gui/tk/hamming_distance/hamming_distance.rb +0 -262
  421. data/lib/bioroebe/gui/tk/levensthein_distance/levensthein_distance.rb +0 -243
  422. data/lib/bioroebe/gui/tk/three_to_one/three_to_one.rb +0 -199
  423. data/lib/bioroebe/gui/unified_widgets/anti_sense_strand/anti_sense_strand.rb +0 -519
  424. data/lib/bioroebe/shell/colours/colours.rb +0 -235
  425. data/lib/bioroebe/shell/help/help.rb +0 -25
  426. data/lib/bioroebe/shell/misc.rb +0 -10227
  427. data/lib/bioroebe/toplevel_methods/ad_hoc_task.rb +0 -56
  428. data/lib/bioroebe/toplevel_methods/aminoacids_and_proteins.rb +0 -722
  429. data/lib/bioroebe/toplevel_methods/atomic_composition.rb +0 -198
  430. data/lib/bioroebe/toplevel_methods/base_composition.rb +0 -121
  431. data/lib/bioroebe/toplevel_methods/blast.rb +0 -153
  432. data/lib/bioroebe/toplevel_methods/calculate_n50_value.rb +0 -57
  433. data/lib/bioroebe/toplevel_methods/cat.rb +0 -71
  434. data/lib/bioroebe/toplevel_methods/chunked_display.rb +0 -92
  435. data/lib/bioroebe/toplevel_methods/cliner.rb +0 -81
  436. data/lib/bioroebe/toplevel_methods/complement.rb +0 -58
  437. data/lib/bioroebe/toplevel_methods/convert_global_env.rb +0 -39
  438. data/lib/bioroebe/toplevel_methods/databases.rb +0 -73
  439. data/lib/bioroebe/toplevel_methods/delimiter.rb +0 -19
  440. data/lib/bioroebe/toplevel_methods/digest.rb +0 -81
  441. data/lib/bioroebe/toplevel_methods/download_and_fetch_data.rb +0 -146
  442. data/lib/bioroebe/toplevel_methods/e.rb +0 -20
  443. data/lib/bioroebe/toplevel_methods/editor.rb +0 -21
  444. data/lib/bioroebe/toplevel_methods/esystem.rb +0 -22
  445. data/lib/bioroebe/toplevel_methods/exponential_growth.rb +0 -74
  446. data/lib/bioroebe/toplevel_methods/extract.rb +0 -56
  447. data/lib/bioroebe/toplevel_methods/file_and_directory_related_actions.rb +0 -269
  448. data/lib/bioroebe/toplevel_methods/frequencies.rb +0 -99
  449. data/lib/bioroebe/toplevel_methods/hamming_distance.rb +0 -60
  450. data/lib/bioroebe/toplevel_methods/infer.rb +0 -66
  451. data/lib/bioroebe/toplevel_methods/leading_five_prime_and_trailing_three_prime.rb +0 -101
  452. data/lib/bioroebe/toplevel_methods/levensthein.rb +0 -63
  453. data/lib/bioroebe/toplevel_methods/log_directory.rb +0 -109
  454. data/lib/bioroebe/toplevel_methods/longest_common_substring.rb +0 -55
  455. data/lib/bioroebe/toplevel_methods/map_ncbi_entry_to_eutils_id.rb +0 -88
  456. data/lib/bioroebe/toplevel_methods/matches.rb +0 -259
  457. data/lib/bioroebe/toplevel_methods/misc.rb +0 -596
  458. data/lib/bioroebe/toplevel_methods/nucleotides.rb +0 -787
  459. data/lib/bioroebe/toplevel_methods/number_of_clones.rb +0 -63
  460. data/lib/bioroebe/toplevel_methods/open_in_browser.rb +0 -79
  461. data/lib/bioroebe/toplevel_methods/open_reading_frames.rb +0 -236
  462. data/lib/bioroebe/toplevel_methods/opn.rb +0 -34
  463. data/lib/bioroebe/toplevel_methods/palindromes.rb +0 -155
  464. data/lib/bioroebe/toplevel_methods/parse.rb +0 -59
  465. data/lib/bioroebe/toplevel_methods/phred_error_probability.rb +0 -68
  466. data/lib/bioroebe/toplevel_methods/rds.rb +0 -24
  467. data/lib/bioroebe/toplevel_methods/remove.rb +0 -86
  468. data/lib/bioroebe/toplevel_methods/return_source_code_of_this_method.rb +0 -35
  469. data/lib/bioroebe/toplevel_methods/return_subsequence_based_on_indices.rb +0 -68
  470. data/lib/bioroebe/toplevel_methods/rna_splicing.rb +0 -73
  471. data/lib/bioroebe/toplevel_methods/rnalfold.rb +0 -69
  472. data/lib/bioroebe/toplevel_methods/searching_and_finding.rb +0 -116
  473. data/lib/bioroebe/toplevel_methods/shuffleseq.rb +0 -37
  474. data/lib/bioroebe/toplevel_methods/statistics.rb +0 -53
  475. data/lib/bioroebe/toplevel_methods/sum_of_odd_integers.rb +0 -62
  476. data/lib/bioroebe/toplevel_methods/three_delimiter.rb +0 -34
  477. data/lib/bioroebe/toplevel_methods/time_and_date.rb +0 -53
  478. data/lib/bioroebe/toplevel_methods/to_camelcase.rb +0 -31
  479. data/lib/bioroebe/toplevel_methods/truncate.rb +0 -48
  480. data/lib/bioroebe/toplevel_methods/url.rb +0 -36
  481. data/lib/bioroebe/toplevel_methods/verbose.rb +0 -59
  482. data/lib/bioroebe/utility_scripts/showorf/constants.rb +0 -31
  483. data/lib/bioroebe/utility_scripts/showorf/help.rb +0 -33
  484. data/lib/bioroebe/utility_scripts/showorf/initialize.rb +0 -52
  485. data/lib/bioroebe/utility_scripts/showorf/menu.rb +0 -68
  486. data/lib/bioroebe/utility_scripts/showorf/reset.rb +0 -36
  487. data/lib/bioroebe/utility_scripts/showorf/run.rb +0 -152
  488. data/lib/bioroebe/utility_scripts/showorf/show.rb +0 -97
  489. /data/doc/{german_names_for_the_aminoacids.md → german_names_for_the_aminoacids/german_names_for_the_aminoacids.md} +0 -0
  490. /data/doc/{pdb_ATOM_entry.md → pdb_ATOM_entry/pdb_ATOM_entry.md} +0 -0
  491. /data/doc/{resources.md → resources/resources.md} +0 -0
  492. /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/aminoacid_composition/customized_dialog.rb +0 -0
  493. /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/anti_sense_strand/anti_sense_strand.config +0 -0
  494. /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/calculate_cell_numbers_of_bacteria/calculate_cell_numbers_of_bacteria.config +0 -0
  495. /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/dna_to_reverse_complement_widget/dna_to_reverse_complement_widget.config +0 -0
  496. /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/hamming_distance/hamming_distance.config +0 -0
  497. /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/levensthein_distance/levensthein_distance.config +0 -0
  498. /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/protein_to_DNA/protein_to_DNA.config +0 -0
  499. /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/restriction_enzymes/restriction_enzymes.config +0 -0
  500. /data/lib/bioroebe/gui/{gtk3 → universal_widgets}/www_finder/www_finder.config +0 -0
  501. /data/lib/bioroebe/yaml/{base_composition_of_dna.yml → base_composition_of_dna/base_composition_of_dna.yml} +0 -0
  502. /data/lib/bioroebe/yaml/{nuclear_localization_sequences.yml → nuclear_localization_sequences/nuclear_localization_sequences.yml} +0 -0
  503. /data/lib/bioroebe/yaml/{talens.yml → talens/talens.yml} +0 -0
@@ -1,596 +0,0 @@
1
- #!/usr/bin/ruby -w
2
- # Encoding: UTF-8
3
- # frozen_string_literal: true
4
- # =========================================================================== #
5
- # require 'bioroebe/toplevel_methods/misc.rb'
6
- # Bioroebe.reverse_sequence(ARGV)
7
- # Bioroebe.bisulfite_treatment(ARGV)
8
- # Bioroebe.return_DNA_composition_hash
9
- # =========================================================================== #
10
- module Bioroebe
11
-
12
- require 'bioroebe/encoding/encoding.rb'
13
- require 'bioroebe/toplevel_methods/aminoacids_and_proteins.rb'
14
- require 'bioroebe/toplevel_methods/e.rb'
15
- require 'bioroebe/toplevel_methods/esystem.rb'
16
- require 'bioroebe/toplevel_methods/extract.rb'
17
-
18
- # ========================================================================= #
19
- # === Bioroebe.percentage_count_non_DNA_bases_in_this_sequence
20
- #
21
- # Usage examples:
22
- #
23
- # Bioroebe.percentage_count_non_DNA_bases_in_this_sequence('ATCGF')
24
- # Bioroebe.percentage_count_non_DNA_bases_in_this_sequence('ACTNGTGCTYGATRGTAGC', %w( A T G C Y R ))
25
- #
26
- # ========================================================================= #
27
- def self.percentage_count_non_DNA_bases_in_this_sequence(
28
- i, array = Bioroebe.return_DNA_nucleotides
29
- )
30
- n = count_non_DNA_bases_in_this_sequence(i, array)
31
- percentage = (n * 100.0 / i.size.to_f)
32
- return percentage
33
- end
34
-
35
- # ========================================================================= #
36
- # === Bioroebe.count_non_DNA_bases_in_this_sequence
37
- #
38
- # Usage example:
39
- #
40
- # Bioroebe.count_non_DNA_bases_in_this_sequence('ATCGF')
41
- #
42
- # ========================================================================= #
43
- def self.count_non_DNA_bases_in_this_sequence(
44
- i, array = Bioroebe.return_DNA_nucleotides
45
- )
46
- i = i.dup
47
- array.each {|this_nucleotide|
48
- i.delete!(this_nucleotide)
49
- }
50
- return i.size
51
- end
52
-
53
- # ========================================================================= #
54
- # === Bioroebe.sequence_based_on_these_restriction_enzymes
55
- #
56
- # Usage example:
57
- #
58
- # x = Bioroebe.sequence_based_on_these_restriction_enzymes(%w( EcoRI SacI KpnI XmaI BamHI XbaI SalI )); 'GAATTCGAGCTCGGTACCCCCGGGGGATCCTCTAGAGTCGAC'
59
- #
60
- # ========================================================================= #
61
- def self.sequence_based_on_these_restriction_enzymes(*i)
62
- require 'bioroebe/enzymes/restriction_enzyme.rb'
63
- _ = ''.dup
64
- i.flatten.each {|this_restriction_enzyme|
65
- _ << ::Bioroebe.restriction_sites?(this_restriction_enzyme)
66
- }
67
- return _
68
- end
69
-
70
- # ========================================================================= #
71
- # === Bioroebe.create_jar_archive
72
- #
73
- # This method will create a .jar file.
74
- #
75
- # To invoke it from the commandline do:
76
- #
77
- # bioroebe --jar
78
- #
79
- # To execute a .jar file do:
80
- #
81
- # java -jar foobar.jar
82
- #
83
- # ========================================================================= #
84
- def self.create_jar_archive
85
- e 'Creating a .jar archive next:'
86
- e
87
- original_dir = return_pwd
88
- cd '/home/x/programming/ruby/src/bioroebe/lib/bioroebe/java/bioroebe/src/main/java/'
89
- esystem 'jar cf bioroebe.jar bioroebe/'
90
- target_file = File.absolute_path('bioroebe.jar')
91
- cd original_dir
92
- if File.exist? target_file
93
- e 'Moving the created .jar file into the current working '\
94
- 'directory next.'
95
- move_file(target_file, original_dir)
96
- e 'It should now be at:'
97
- e
98
- e sfile(" #{original_dir}#{File.basename(target_file)}")
99
- e
100
- end
101
- # esystem 'jar cfe bioroebe.jar myClass myClass.class'
102
- e
103
- end
104
-
105
- # ========================================================================= #
106
- # === Bioroebe.frequency_per_thousand
107
- #
108
- # The input to this method should be a String ideally. If an Array is
109
- # input then it will simply be .join()-ed.
110
- #
111
- # This method will return a String, if all goes well.
112
- # ========================================================================= #
113
- def self.frequency_per_thousand(i)
114
- result = "fields: [triplet] [frequency: per thousand] ([number])\n".dup # This String will be returned.
115
- if i.is_a? Array
116
- i = i.join
117
- end
118
- i.delete!("\n")
119
- hash = ::Bioroebe.codon_frequency_of_this_string(i)
120
- hash.default = 0
121
- total_n_elements = hash.values.sum
122
- append_this = <<-EOF
123
-
124
- UUU#{thousand_percentage(hash['UUU'], total_n_elements)}( #{hash['UUU']}) UCU#{thousand_percentage(hash['UCU'], total_n_elements)}( #{hash['UCU']}) UAU#{thousand_percentage(hash['UAU'], total_n_elements)}( #{hash['UAU']}) UGU#{thousand_percentage(hash['UGU'], total_n_elements)}( #{hash['UGU']})
125
- UUC#{thousand_percentage(hash['UUC'], total_n_elements)}( #{hash['UUC']}) UCC#{thousand_percentage(hash['UCC'], total_n_elements)}( #{hash['UCC']}) UAC#{thousand_percentage(hash['UAC'], total_n_elements)}( #{hash['UAC']}) UGC#{thousand_percentage(hash['UGC'], total_n_elements)}( #{hash['UGC']})
126
- UUA#{thousand_percentage(hash['UUA'], total_n_elements)}( #{hash['UUA']}) UCA#{thousand_percentage(hash['UCA'], total_n_elements)}( #{hash['UCA']}) UAA#{thousand_percentage(hash['UAA'], total_n_elements)}( #{hash['UAA']}) UGA#{thousand_percentage(hash['UGA'], total_n_elements)}( #{hash['UGA']})
127
- UUG#{thousand_percentage(hash['UUG'], total_n_elements)}( #{hash['UUG']}) UCG#{thousand_percentage(hash['UCG'], total_n_elements)}( #{hash['UCG']}) UAG#{thousand_percentage(hash['UAG'], total_n_elements)}( #{hash['UAG']}) UGG#{thousand_percentage(hash['UGG'], total_n_elements)}( #{hash['UGG']})
128
-
129
- CUU#{thousand_percentage(hash['CUU'], total_n_elements)}( #{hash['CUU']}) CCU#{thousand_percentage(hash['CCU'], total_n_elements)}( #{hash['CCU']}) CAU#{thousand_percentage(hash['CAU'], total_n_elements)}( #{hash['CAU']}) CGU#{thousand_percentage(hash['CGU'], total_n_elements)}( #{hash['CGU']})
130
- CUC#{thousand_percentage(hash['CUC'], total_n_elements)}( #{hash['CUC']}) CCC#{thousand_percentage(hash['CCC'], total_n_elements)}( #{hash['CCC']}) CAC#{thousand_percentage(hash['CAC'], total_n_elements)}( #{hash['CAC']}) CGC#{thousand_percentage(hash['CGC'], total_n_elements)}( #{hash['CGC']})
131
- CUA#{thousand_percentage(hash['CUA'], total_n_elements)}( #{hash['CUA']}) CCA#{thousand_percentage(hash['CCA'], total_n_elements)}( #{hash['CCA']}) CAA#{thousand_percentage(hash['CAA'], total_n_elements)}( #{hash['CAA']}) CGA#{thousand_percentage(hash['CGA'], total_n_elements)}( #{hash['CGA']})
132
- CUG#{thousand_percentage(hash['CUG'], total_n_elements)}( #{hash['CUG']}) CCG#{thousand_percentage(hash['CCG'], total_n_elements)}( #{hash['CCG']}) CAG#{thousand_percentage(hash['CAG'], total_n_elements)}( #{hash['CAG']}) CGG#{thousand_percentage(hash['CGG'], total_n_elements)}( #{hash['CGG']})
133
-
134
- AUU#{thousand_percentage(hash['AUU'], total_n_elements)}( #{hash['AUU']}) ACU#{thousand_percentage(hash['ACU'], total_n_elements)}( #{hash['ACU']}) AAU#{thousand_percentage(hash['AAU'], total_n_elements)}( #{hash['AAU']}) AGU#{thousand_percentage(hash['AGU'], total_n_elements)}( #{hash['AGU']})
135
- AUC#{thousand_percentage(hash['AUC'], total_n_elements)}( #{hash['AUC']}) ACC#{thousand_percentage(hash['ACC'], total_n_elements)}( #{hash['ACC']}) AAC#{thousand_percentage(hash['AAC'], total_n_elements)}( #{hash['AAC']}) AGC#{thousand_percentage(hash['AGC'], total_n_elements)}( #{hash['AGC']})
136
- AUA#{thousand_percentage(hash['AUA'], total_n_elements)}( #{hash['AUA']}) ACA#{thousand_percentage(hash['ACA'], total_n_elements)}( #{hash['ACA']}) AAA#{thousand_percentage(hash['AAA'], total_n_elements)}( #{hash['AAA']}) AGA#{thousand_percentage(hash['AGA'], total_n_elements)}( #{hash['AGA']})
137
- AUG#{thousand_percentage(hash['AUG'], total_n_elements)}( #{hash['AUG']}) ACG#{thousand_percentage(hash['ACG'], total_n_elements)}( #{hash['ACG']}) AAG#{thousand_percentage(hash['AAG'], total_n_elements)}( #{hash['AAG']}) AGG#{thousand_percentage(hash['AGG'], total_n_elements)}( #{hash['AGG']})
138
-
139
- GUU#{thousand_percentage(hash['GUU'], total_n_elements)}( #{hash['GUU']}) GCU#{thousand_percentage(hash['GCU'], total_n_elements)}( #{hash['GCU']}) GAU#{thousand_percentage(hash['GAU'], total_n_elements)}( #{hash['GAU']}) GGU#{thousand_percentage(hash['GGU'], total_n_elements)}( #{hash['GGU']})
140
- GUC#{thousand_percentage(hash['GUC'], total_n_elements)}( #{hash['GUC']}) GCC#{thousand_percentage(hash['GCC'], total_n_elements)}( #{hash['GCC']}) GAC#{thousand_percentage(hash['GAC'], total_n_elements)}( #{hash['GAC']}) GGC#{thousand_percentage(hash['GGC'], total_n_elements)}( #{hash['GGC']})
141
- GUA#{thousand_percentage(hash['GUA'], total_n_elements)}( #{hash['GUA']}) GCA#{thousand_percentage(hash['GCA'], total_n_elements)}( #{hash['GCA']}) GAA#{thousand_percentage(hash['GAA'], total_n_elements)}( #{hash['GAA']}) GGA#{thousand_percentage(hash['GGA'], total_n_elements)}( #{hash['GGA']})
142
- GUG#{thousand_percentage(hash['GUG'], total_n_elements)}( #{hash['GUG']}) GCG#{thousand_percentage(hash['GCG'], total_n_elements)}( #{hash['GCG']}) GAG#{thousand_percentage(hash['GAG'], total_n_elements)}( #{hash['GAG']}) GGG#{thousand_percentage(hash['GGG'], total_n_elements)}( #{hash['GGG']})
143
- EOF
144
- result << append_this
145
- return result
146
- end
147
-
148
- # ========================================================================= #
149
- # === Bioroebe.codon_frequency_of_this_string
150
- #
151
- # The input to this method should ideally be a String. It will be assumed
152
- # to be a RNA string, e. g. mRNA. Thus, all T are replaced with U by
153
- # default. This can be toggled via the second argument of this method.
154
- #
155
- # This method will return a Hash.
156
- #
157
- # Usage example:
158
- #
159
- # Bioroebe.codon_frequency_of_this_string
160
- # Bioroebe.codon_frequency_of_this_string 'ATTCGTACGATCGACTACTACT' # => {"UAC"=>2, "GAC"=>1, "AUC"=>1, "ACG"=>1, "CGU"=>1, "AUU"=>1}
161
- #
162
- # ========================================================================= #
163
- def self.codon_frequency_of_this_string(
164
- i = 'ATTCGTACGATCGACTGACTGACAGTCATTCGTAGTACGATCGACTGACTGACAGTCATTCGTAC'\
165
- 'GATCGACTGACTGACAAGTCATTCGTACGATCGACTGACTTGACAGTCATAA',
166
- automatically_convert_into_a_RNA_sequence = true
167
- )
168
- i = i.join if i.is_a? Array
169
- if automatically_convert_into_a_RNA_sequence
170
- i = i.dup if i.frozen?
171
- i.tr!('T','U')
172
- end
173
- scanned = i.scan(/.../)
174
- tally = scanned.tally
175
- # ======================================================================= #
176
- # We still have to sort it.
177
- # ======================================================================= #
178
- sorted_hash = Hash[tally.sort_by {|key, value| value }.reverse]
179
- return sorted_hash
180
- end
181
-
182
- # ========================================================================= #
183
- # === Bioroebe.thousand_percentage
184
- #
185
- # This method is solely a helper-method for Bioroebe.frequency_per_thousand().
186
- # ========================================================================= #
187
- def self.thousand_percentage(
188
- this_codon_n_times = 1,
189
- total_n_elements = 1000
190
- )
191
- result = (
192
- (this_codon_n_times * 1000.0) / total_n_elements.to_f
193
- ).round(1)
194
- padded_result = result.to_s.rjust(5, ' ')
195
- return padded_result
196
- end
197
-
198
- # ========================================================================= #
199
- # === Bioroebe.align_this_string_via_multiple_sequence_alignment
200
- #
201
- # This method will simply return an Array.
202
- # ========================================================================= #
203
- def self.align_this_string_via_multiple_sequence_alignment(
204
- this_string =
205
- "PSRARRDAVG--DH--PAVEALP----PQSGPHKKEISFFTVRKEEAADADLWFPS
206
- PGGASK--VGQTDNDPQAIKDLP----PQGED------------------------
207
- "
208
- )
209
- if this_string.is_a? Array
210
- this_string = this_string.join("\n")
211
- end
212
- this_string = this_string.dup if this_string.frozen?
213
- this_string.strip!
214
- this_string.delete!(' ')
215
- splitted = this_string.split("\n")
216
- return splitted
217
- end
218
-
219
- # ========================================================================= #
220
- # === Bioroebe.quaternary_encoding_translate_from_alphabet_string_into_the_corresponding_DNA_sequence
221
- #
222
- # Usage example:
223
- #
224
- # Bioroebe.quaternary_encoding_translate_from_alphabet_string_into_the_corresponding_DNA_sequence('OTTO')
225
- #
226
- # ========================================================================= #
227
- def self.quaternary_encoding_translate_from_alphabet_string_into_the_corresponding_DNA_sequence(
228
- this_string = 'Hello world'
229
- )
230
- _ = ''.dup
231
- chars = this_string.chars
232
- chars.each {|this_char|
233
- case chars
234
- when ' ','!','?'
235
- # pass through in this case.
236
- else
237
- this_char = this_char.upcase
238
- _ << Bioroebe.quaternary_encoding_letter_to_number(this_char)
239
- end
240
- }
241
- return _
242
- end
243
-
244
- # ========================================================================= #
245
- # === Bioroebe.quaternary_encoding_DNA_to_numbers
246
- #
247
- # You can pass in another hash as the second argument to this method,
248
- # if you'd like to.
249
- #
250
- # Usage example:
251
- #
252
- # Bioroebe.quaternary_encoding_DNA_to_numbers('TACATCTTTCGATCGATCGG') # => "10201211123012301233"
253
- #
254
- # ========================================================================= #
255
- def self.quaternary_encoding_DNA_to_numbers(
256
- i = 'TACATCTTTCGATCGATCGG',
257
- hash = { A: 0, T: 1, C: 2, G: 3 }
258
- )
259
- i = i.chars unless i.is_a? Array
260
- return i.map {|entry|
261
- hash[entry.to_sym]
262
- }.join
263
- end
264
-
265
- # ========================================================================= #
266
- # === Bioroebe.quaternary_encoding_letter_to_number
267
- # ========================================================================= #
268
- def self.quaternary_encoding_letter_to_number(
269
- letter,
270
- use_this_hash = {
271
- '0000': :A,
272
- '1000': :B,
273
- '2000': :C,
274
- '3000': :D,
275
- '0100': :E,
276
- '0200': :F,
277
- '0300': :G,
278
- '0010': :H,
279
- '0020': :I,
280
- '0030': :J,
281
- '0001': :K,
282
- '0002': :L,
283
- '0003': :M,
284
- '1100': :N,
285
- '1200': :O,
286
- '1300': :P,
287
- '1110': :Q,
288
- '1120': :R,
289
- '1130': :S,
290
- '1210': :T,
291
- '1220': :U,
292
- '1230': :V,
293
- '1231': :W
294
- })
295
- use_this_hash = use_this_hash.invert
296
- return use_this_hash[letter.to_sym].to_s
297
- end
298
-
299
- # ========================================================================= #
300
- # === Bioroebe.quaternary_encoding_number_to_letter
301
- # ========================================================================= #
302
- def self.quaternary_encoding_number_to_letter(
303
- number,
304
- use_this_hash = {
305
- '0000': :A,
306
- '1000': :B,
307
- '2000': :C,
308
- '3000': :D,
309
- '0100': :E,
310
- '0200': :F,
311
- '0300': :G,
312
- '0010': :H,
313
- '0020': :I,
314
- '0030': :J,
315
- '0001': :K,
316
- '0002': :L,
317
- '0003': :M,
318
- '1100': :N,
319
- '1200': :O,
320
- '1300': :P,
321
- '1110': :Q,
322
- '1120': :R,
323
- '1130': :S,
324
- '1210': :T,
325
- '1220': :U,
326
- '1230': :V,
327
- '1231': :W
328
- })
329
- return use_this_hash[number.to_s].to_s
330
- end
331
-
332
- # ========================================================================= #
333
- # === Bioroebe.quaternary_encoding_numbers_to_DNA
334
- # ========================================================================= #
335
- def self.quaternary_encoding_numbers_to_DNA(
336
- i = '10201211123012301233',
337
- hash = { A: 0, T: 1, C: 2, G: 3 }
338
- )
339
- i = i.chars unless i.is_a? Array
340
- inverted_hash = hash.invert
341
- return i.map {|number|
342
- inverted_hash[number.to_i]
343
- }.join
344
- end
345
-
346
- # ========================================================================= #
347
- # === Bioroebe.download_human_genome
348
- # ========================================================================= #
349
- def self.download_human_genome(
350
- from_this_URL = 'https://bioconductor.org/packages/release/data/annotation/src/contrib/BSgenome.Hsapiens.UCSC.hg38_1.4.4.tar.gz'
351
- )
352
- esystem "wget #{from_this_URL}"
353
- extract(
354
- File.basename(from_this_URL)
355
- )
356
- end
357
-
358
- # ========================================================================= #
359
- # === Bioroebe.guess_format
360
- # ========================================================================= #
361
- def self.guess_format(i)
362
- case i
363
- # ======================================================================= #
364
- # === fasta
365
- # ======================================================================= #
366
- when /.fa$/,
367
- /.fna$/,
368
- /.faa$/,
369
- /.fasta$/
370
- 'fasta'
371
- # ======================================================================= #
372
- # === fastq
373
- # ======================================================================= #
374
- when /.fq$/,
375
- /.fastq$/
376
- 'fastq'
377
- when /.fx/
378
- ''
379
- end
380
- end
381
-
382
- # ========================================================================= #
383
- # === Bioroebe.return_ubiquitin_sequence
384
- #
385
- # This method will simply return the Ubiquitin sequence. We may also
386
- # colourize some aminoacids, if we have enabled this.
387
- # ========================================================================= #
388
- def self.return_ubiquitin_sequence(
389
- i = 'MQIFVKTLTGKTITLEVEPSDTIENVKAKIQDKEGIPPDQQRLIFAGKQLEDGRTLSDYNIQKESTLHLVLRLRGG'
390
- )
391
- colourize_aa(i) # Consider colourizing it.
392
- end; self.instance_eval { alias ubiquitin return_ubiquitin_sequence } # === Bioroebe.ubiquitin
393
-
394
- # ========================================================================= #
395
- # === Bioroebe.reverse_sequence
396
- # ========================================================================= #
397
- def self.reverse_sequence(i)
398
- i = i.first if i.is_a? Array
399
- i.reverse
400
- end
401
-
402
- # ========================================================================= #
403
- # === Bioroebe.bisulfite_treatment
404
- #
405
- # Simply convert all C into U. The underlying idea here is that
406
- # bilsufite will convert unmethylated Cytosines into Uracil.
407
- #
408
- # Usage example:
409
- #
410
- # Bioroebe.bisulfite_treatment('CCCGCAATGCATACCTCGCCG') # => "UUUGUAATGUATAUUTUGUUG"
411
- #
412
- # ========================================================================= #
413
- def self.bisulfite_treatment(i)
414
- if i.is_a? Array
415
- i = i.join('').strip
416
- end
417
- i.tr('C','U')
418
- end; self.instance_eval { alias bisulfie bisulfite_treatment } # === Bioroebe.bisulfite
419
-
420
- # ========================================================================= #
421
- # === Bioroebe.batch_create_windows_executables
422
- #
423
- # This method is only useful for windows. We will use "ocra" to create
424
- # various .exe files that have the desired widgt-functionality.
425
- #
426
- # Note that the functionality depends on the roebe-gem.
427
- # ========================================================================= #
428
- def self.batch_create_windows_executables
429
- begin
430
- require 'roebe/custom_methods/custom_methods.rb'
431
- rescue LoadError; end
432
- array_these_files = %w(
433
- /home/x/programming/ruby/src/bioroebe/lib/bioroebe/gui/libui/hamming_distance/hamming_distance.rb
434
- )
435
- array_these_files.each {|this_file|
436
- Roebe.ocra_build(
437
- this_file,
438
- File.basename(this_file).delete_suffix('.rb')
439
- )
440
- }
441
- end
442
-
443
- # ========================================================================= #
444
- # === Bioroebe.create_the_pdf_tutorial
445
- #
446
- # This method can be used to quickly turn the README.md file into
447
- # a .pdf file, for whatever the reason the user may want this.
448
- # ========================================================================= #
449
- def self.create_the_pdf_tutorial(
450
- read_from_this_file = '/home/x/programming/ruby/src/bioroebe/README.md',
451
- store_where = '/Depot/j/example.pdf'
452
- )
453
-
454
- require 'prawn'
455
-
456
- Prawn::Fonts::AFM.hide_m17n_warning = true # Hide a useless warning.
457
-
458
- pdf = Prawn::Document.new(
459
- page_size: 'A4',
460
- page_layout: :landscape
461
- )
462
- pdf.text "The Bioroebe Project", size: 80
463
- pdf.start_new_page
464
- pdf.bounding_box [50, 600], width: 200 do
465
- pdf.fill_color '000000'
466
- pdf.text "making bioinformatics great again:", size: 15
467
- end
468
- pdf.start_new_page
469
- dataset = File.read(read_from_this_file, encoding: UTF_ENCODING)
470
- dataset = dataset.encode("Windows-1252", invalid: :replace, undef: :replace)
471
-
472
- pdf.text(dataset)
473
- e 'Storing at this location: '+store_where
474
- pdf.render_file store_where
475
- end; self.instance_eval { alias pdf create_the_pdf_tutorial } # === Bioroebe.pdf
476
-
477
- # ========================================================================= #
478
- # === Bioroebe.return_DNA_composition_hash
479
- # ========================================================================= #
480
- def self.return_DNA_composition_hash(
481
- of_this_sequence
482
- )
483
- of_this_sequence = of_this_sequence.first if of_this_sequence.is_a? Array
484
- hash = {}
485
- array1 = %w( A T C G )
486
- array2 = Array.new(array1.size, 0)
487
- array = array1.zip(array2) # Zip it up with 0-values here.
488
- hash = Hash[array]
489
- of_this_sequence.chars.each {|this_char|
490
- hash[this_char] += 1
491
- }
492
- sorted_hash = Hash[*hash.sort_by {|key, value|
493
- key
494
- }.flatten]
495
- # ======================================================================= #
496
- # The hash may then look like this:
497
- #
498
- # {"A"=>7, "T"=>6, "C"=>7, "G"=>6}
499
- #
500
- # ======================================================================= #
501
- return sorted_hash
502
- end
503
-
504
- # ========================================================================= #
505
- # === Bioroebe.windows_platform?
506
- # ========================================================================= #
507
- def self.windows_platform?
508
- case RUBY_PLATFORM
509
- when /(?:mswin|bccwin|mingw|windows)(?:32|64)/i
510
- true
511
- else
512
- false
513
- end
514
- end; self.instance_eval { alias on_windows? windows_platform? } # === Bioroebe.on_windows?
515
- self.instance_eval { alias is_on_windows? windows_platform? } # === Bioroebe.is_on_windows?
516
-
517
- # ========================================================================= #
518
- # === Bioroebe.two_dimensional_plot
519
- #
520
- # This method makes use of gnuplot to draw a 2D plot.
521
- #
522
- # The first argument should contain your dataset, as a String.
523
- # ========================================================================= #
524
- def self.two_dimensional_plot(
525
- dataset = '6 12
526
- 8 14
527
- 10 18
528
- 12 23
529
- 14 28
530
- 16 29
531
- 18 26
532
- 20 23
533
- 22 20',
534
- optional_hash = {
535
- width: 800,
536
- height: 640
537
- }
538
- )
539
- # ======================================================================= #
540
- # Provide some generic fall-back values for width and height next:
541
- # ======================================================================= #
542
- width = 1000
543
- height = 800
544
- _ = optional_hash
545
- if _.is_a? Hash
546
- # ===================================================================== #
547
- # === :width
548
- # ===================================================================== #
549
- if _.has_key? :width
550
- width = _.delete(:width)
551
- end
552
- # ===================================================================== #
553
- # === :height
554
- # ===================================================================== #
555
- if _.has_key? :height
556
- height = _.delete(:height)
557
- end
558
- end
559
- # ======================================================================= #
560
- # Go to a safe base directory.
561
- # ======================================================================= #
562
- cd :bioroebe_log_directory
563
- mkdir 'gnuplot' unless File.directory?('gnuplot')
564
- cd 'gnuplot'
565
- # ======================================================================= #
566
- # First save the dataset into dataset.md:
567
- # ======================================================================= #
568
- into = File.absolute_path('dataset.md')
569
- e 'Storing the dataset into '+sfile(into)+' next.'
570
- write_what_into(dataset, into)
571
- what = <<-EOF
572
-
573
- set terminal png size #{width},#{height} enhanced font "Helvetica, 18"
574
- set output 'fancy_graph.png'
575
- plot '#{into}' with linespoints ls 1 notitle
576
-
577
- EOF
578
- into = File.absolute_path('gnuplot.file')
579
- e 'Storing into '+into+'.'
580
- write_what_into(what, into)
581
- esystem 'gnuplot '+into
582
- if File.exist? 'fancy_graph.png' and is_on_roebe?
583
- Open.in_browser('fancy_graph.png')
584
- end
585
- end
586
-
587
- end
588
-
589
- if __FILE__ == $PROGRAM_NAME
590
- puts Bioroebe.reverse_sequence(ARGV)
591
- puts Bioroebe.bisulfite_treatment('CCCGCAATGCATACCTCGCCG')
592
- puts Bioroebe.return_ubiquitin_sequence
593
- pp Bioroebe.return_DNA_composition_hash(ARGV)
594
- end # rb misc ATGC # => CGTA
595
- # rb misc.rb GATCTGCAGTACGTACGTACTGACAC
596
- # returnubiquitinsequence